Skip to content

Commit a8f47a4

Browse files
feat(mathy_alpha_sm): updated multi-task model
1 parent fc27522 commit a8f47a4

File tree

3 files changed

+12
-12
lines changed

3 files changed

+12
-12
lines changed

libraries/mathy_alpha_sm/mathy_alpha_sm/model.config.json

Lines changed: 12 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -6,47 +6,47 @@
66
"author": "Justin DuJardin",
77
"email": "justin@dujardinconsulting.com",
88
"url": "https://mathy.ai",
9-
"mathy_version": ">=0.0.0,<1.0.0",
9+
"mathy_version": "0.3.5",
1010
"units": 512,
1111
"embedding_units": 512,
1212
"lstm_units": 128,
1313
"topics": [
14-
"poly-combine"
14+
"poly"
1515
],
16-
"difficulty": null,
17-
"model_dir": "/var/folders/q3/j42n3r692gb2yl9cp1ncs3q00000gn/T/tmpa8tndnqz",
16+
"difficulty": "easy",
17+
"model_dir": "./training/alpha_piv_new",
1818
"model_name": "model",
1919
"init_model_from": null,
2020
"train": false,
2121
"verbose": false,
2222
"lr": 0.0003,
23-
"max_eps": 1,
23+
"max_eps": 15000,
2424
"summary_interval": 100,
2525
"gamma": 0.99,
26-
"num_workers": 1,
26+
"num_workers": 4,
2727
"td_lambda": 0.2,
2828
"print_training": false,
2929
"print_mode": "terminal",
3030
"use_term_order": false,
3131
"use_tree_complexity": false,
3232
"use_grouping_control": true,
33-
"clip_grouping_control": false,
33+
"clip_grouping_control": true,
3434
"use_env_features": false,
3535
"use_node_values": true,
3636
"update_gradients_every": 64,
3737
"num_thinking_steps_begin": 3,
38-
"mcts_sims": 200,
39-
"worker_wait": 0.01,
38+
"mcts_sims": 10,
39+
"worker_wait": 0.1,
4040
"profile": false,
4141
"action_strategy": "a3c",
4242
"main_worker_use_epsilon": false,
4343
"e_greedy_min": 0.01,
4444
"e_greedy_max": 0.1,
45-
"entropy_loss_scaling": 1,
45+
"entropy_loss_scaling": 0.05,
4646
"normalize_entropy_loss": true,
47-
"aux_tasks_weight_scale": 1,
47+
"aux_tasks_weight_scale": 0.1,
4848
"teacher_start_evaluations_at_episode": 50,
4949
"teacher_evaluation_steps": 20,
5050
"teacher_promote_wins": 0.95,
5151
"teacher_demote_wins": 0.6
52-
}
52+
}
-6.18 KB
Binary file not shown.
0 Bytes
Binary file not shown.

0 commit comments

Comments
 (0)