# experiments.txt
# sbatch submission commands for the training runs, grouped into the sections below.
#
# Before fixing sign mistake in EFE
#
# Baseline agents: one submission per agent, all with seed=1 and no
# agent.g_value override.
for baseline in VAE HMM DQN; do
  sbatch -p gpu --mem=10G --gres-flags=disable-binding --gres=gpu \
    env_training.sh "agent=${baseline}" seed=1 env.difficulty="hard"
done
# CHMM sweep over every agent.g_value objective: seeds 1-9 leave
# agent.efe_loss_update_encoder unset, seeds 10-18 set it to True.
chmm_objectives=(reward efe_0 efe_1 efe_2 efe_3 befe_0 befe_1 befe_2 befe_3)
for idx in "${!chmm_objectives[@]}"; do
  sbatch -p gpu --mem=10G --gres-flags=disable-binding --gres=gpu \
    env_training.sh agent=CHMM "seed=$((1 + idx))" env.difficulty="hard" \
    "agent.g_value=${chmm_objectives[idx]}"
done
for idx in "${!chmm_objectives[@]}"; do
  sbatch -p gpu --mem=10G --gres-flags=disable-binding --gres=gpu \
    env_training.sh agent=CHMM "seed=$((10 + idx))" env.difficulty="hard" \
    "agent.g_value=${chmm_objectives[idx]}" agent.efe_loss_update_encoder=True
done
# CHMM_2LS sweep over every agent.g_value objective: seeds 19-27 leave
# agent.efe_loss_update_encoder unset, seeds 28-36 set it to True.
two_ls_objectives=(reward efe_0 efe_1 efe_2 efe_3 befe_0 befe_1 befe_2 befe_3)
for pos in "${!two_ls_objectives[@]}"; do
  sbatch -p gpu --mem=10G --gres-flags=disable-binding --gres=gpu \
    env_training.sh agent=CHMM_2LS "seed=$((19 + pos))" env.difficulty="hard" \
    "agent.g_value=${two_ls_objectives[pos]}"
done
for pos in "${!two_ls_objectives[@]}"; do
  sbatch -p gpu --mem=10G --gres-flags=disable-binding --gres=gpu \
    env_training.sh agent=CHMM_2LS "seed=$((28 + pos))" env.difficulty="hard" \
    "agent.g_value=${two_ls_objectives[pos]}" agent.efe_loss_update_encoder=True
done
# CHMM_C2LS sweep over every agent.g_value objective. Unlike the CHMM and
# CHMM_2LS sweeps, the agent.efe_loss_update_encoder=True runs come first
# (seeds 37-45); seeds 46-54 leave that option unset.
c2ls_objectives=(reward efe_0 efe_1 efe_2 efe_3 befe_0 befe_1 befe_2 befe_3)
for slot in "${!c2ls_objectives[@]}"; do
  sbatch -p gpu --mem=10G --gres-flags=disable-binding --gres=gpu \
    env_training.sh agent=CHMM_C2LS "seed=$((37 + slot))" env.difficulty="hard" \
    "agent.g_value=${c2ls_objectives[slot]}" agent.efe_loss_update_encoder=True
done
for slot in "${!c2ls_objectives[@]}"; do
  sbatch -p gpu --mem=10G --gres-flags=disable-binding --gres=gpu \
    env_training.sh agent=CHMM_C2LS "seed=$((46 + slot))" env.difficulty="hard" \
    "agent.g_value=${c2ls_objectives[slot]}"
done
# CHMM_CN2LS sweep over every agent.g_value objective. The runs with
# agent.efe_loss_update_encoder=True are submitted first (seeds 55-63);
# seeds 64-72 leave that option unset.
cn2ls_objectives=(reward efe_0 efe_1 efe_2 efe_3 befe_0 befe_1 befe_2 befe_3)
for n in "${!cn2ls_objectives[@]}"; do
  sbatch -p gpu --mem=10G --gres-flags=disable-binding --gres=gpu \
    env_training.sh agent=CHMM_CN2LS "seed=$((55 + n))" env.difficulty="hard" \
    "agent.g_value=${cn2ls_objectives[n]}" agent.efe_loss_update_encoder=True
done
for n in "${!cn2ls_objectives[@]}"; do
  sbatch -p gpu --mem=10G --gres-flags=disable-binding --gres=gpu \
    env_training.sh agent=CHMM_CN2LS "seed=$((64 + n))" env.difficulty="hard" \
    "agent.g_value=${cn2ls_objectives[n]}"
done
#
# After fixing sign mistake in EFE
#
# CHMM sweep over every agent.g_value objective: seeds 73-81 leave
# agent.efe_loss_update_encoder unset, seeds 82-90 set it to True.
fixed_chmm_objectives=(reward efe_0 efe_1 efe_2 efe_3 befe_0 befe_1 befe_2 befe_3)
for j in "${!fixed_chmm_objectives[@]}"; do
  sbatch -p gpu --mem=10G --gres-flags=disable-binding --gres=gpu \
    env_training.sh agent=CHMM "seed=$((73 + j))" env.difficulty="hard" \
    "agent.g_value=${fixed_chmm_objectives[j]}"
done
for j in "${!fixed_chmm_objectives[@]}"; do
  sbatch -p gpu --mem=10G --gres-flags=disable-binding --gres=gpu \
    env_training.sh agent=CHMM "seed=$((82 + j))" env.difficulty="hard" \
    "agent.g_value=${fixed_chmm_objectives[j]}" agent.efe_loss_update_encoder=True
done
# DAI sweep over every agent.g_value objective: seeds 91-99 leave
# agent.efe_loss_update_encoder unset, seeds 100-108 set it to True.
dai_objectives=(reward efe_0 efe_1 efe_2 efe_3 befe_0 befe_1 befe_2 befe_3)
for k in "${!dai_objectives[@]}"; do
  sbatch -p gpu --mem=10G --gres-flags=disable-binding --gres=gpu \
    env_training.sh agent=DAI "seed=$((91 + k))" env.difficulty="hard" \
    "agent.g_value=${dai_objectives[k]}"
done
for k in "${!dai_objectives[@]}"; do
  sbatch -p gpu --mem=10G --gres-flags=disable-binding --gres=gpu \
    env_training.sh agent=DAI "seed=$((100 + k))" env.difficulty="hard" \
    "agent.g_value=${dai_objectives[k]}" agent.efe_loss_update_encoder=True
done
# CHMM sweep with an explicit agent.action_selection, seeds 109-144.
# Seeds are handed out consecutively in loop order: softmax before bestAction;
# within each, the runs without agent.efe_loss_update_encoder come before the
# runs that set it to True; within each of those, the nine objectives in order.
selection_objectives=(reward efe_0 efe_1 efe_2 efe_3 befe_0 befe_1 befe_2 befe_3)
next_seed=109
for selection in softmax bestAction; do
  for encoder_arg in "" agent.efe_loss_update_encoder=True; do
    for objective in "${selection_objectives[@]}"; do
      # ${encoder_arg:+...} contributes no argument at all when encoder_arg is empty.
      sbatch -p gpu --mem=10G --gres-flags=disable-binding --gres=gpu \
        env_training.sh agent=CHMM "seed=${next_seed}" env.difficulty="hard" \
        "agent.g_value=${objective}" ${encoder_arg:+"${encoder_arg}"} \
        "agent.action_selection=${selection}"
      next_seed=$((next_seed + 1))
    done
  done
done
# DAI sweep with an explicit agent.action_selection, seeds 145-164.
# Only the reward and efe_* objectives are submitted here (no befe_* runs).
# Seeds are consecutive in loop order: softmax before bestAction; within each,
# runs without agent.efe_loss_update_encoder precede runs that set it to True.
run_seed=145
for policy in softmax bestAction; do
  for encoder_opt in "" agent.efe_loss_update_encoder=True; do
    for g_value in reward efe_0 efe_1 efe_2 efe_3; do
      # ${encoder_opt:+...} contributes no argument at all when encoder_opt is empty.
      sbatch -p gpu --mem=10G --gres-flags=disable-binding --gres=gpu \
        env_training.sh agent=DAI "seed=${run_seed}" env.difficulty="hard" \
        "agent.g_value=${g_value}" ${encoder_opt:+"${encoder_opt}"} \
        "agent.action_selection=${policy}"
      run_seed=$((run_seed + 1))
    done
  done
done
#
# Additional experiments
#
# fixed_chmm_training.sh sweep, seeds 165-179, over the reward and efe_*
# objectives. No agent= argument is passed to this script. Seeds are
# consecutive in loop order: first no agent.action_selection override,
# then bestAction, then softmax.
fixed_seed=165
for selection_arg in "" agent.action_selection=bestAction agent.action_selection=softmax; do
  for g_value in reward efe_0 efe_1 efe_2 efe_3; do
    # ${selection_arg:+...} contributes no argument at all when selection_arg is empty.
    sbatch -p gpu --mem=10G --gres-flags=disable-binding --gres=gpu \
      fixed_chmm_training.sh "seed=${fixed_seed}" env.difficulty="hard" \
      "agent.g_value=${g_value}" ${selection_arg:+"${selection_arg}"}
    fixed_seed=$((fixed_seed + 1))
  done
done
# AnalysisCHMM runs. The first three submissions keep their original order
# (seeds 201, 202, 200); seeds 203-207 then vary agent.beta_rate with
# agent.n_steps_beta_incr fixed at 200000.
analysis_job=(sbatch -p gpu --mem=10G --gres-flags=disable-binding --gres=gpu
  env_training.sh agent=AnalysisCHMM)
"${analysis_job[@]}" seed=201 env.difficulty="hard" agent.g_value="efe_3" agent.beta=1
"${analysis_job[@]}" seed=202 env.difficulty="hard" agent.g_value="efe_3"
"${analysis_job[@]}" seed=200 env.difficulty="hard" agent.g_value="reward"
beta_rates=(0.5 0.25 0.15 0.05 0.01)
for r in "${!beta_rates[@]}"; do
  "${analysis_job[@]}" "seed=$((203 + r))" env.difficulty="hard" \
    agent.g_value="efe_3" "agent.beta_rate=${beta_rates[r]}" \
    agent.n_steps_beta_incr=200000
done