Skip to content

Commit 02e63e2

Browse files
feat(mathy_alpha_sm): more stable recurrent model
- trained on multiple poly/complex/binomial tasks
1 parent cb2da5f commit 02e63e2

File tree

3 files changed

+54
-52
lines changed

3 files changed

+54
-52
lines changed
Lines changed: 54 additions & 52 deletions
Original file line number | Diff line number | Diff line change
@@ -1,57 +1,59 @@
11
{
2-
"name": "mathy_alpha_sm",
3-
"version": "0.6.7",
4-
"description": "Mathy.ai multi-task small model",
5-
"license": "CC BY-SA 3.0",
6-
"author": "Justin DuJardin",
7-
"email": "justin@dujardinconsulting.com",
8-
"url": "https://mathy.ai",
9-
"mathy_version": ">=0.6.2,<1.0.0",
10-
"prediction_window_size": 7,
11-
"use_lstm": true,
12-
"units": 512,
13-
"embedding_units": 512,
14-
"lstm_units": 128,
15-
"topics": [
2+
"name":"mathy_alpha_sm",
3+
"version":"0.6.7",
4+
"description":"Mathy.ai multi-task small model",
5+
"license":"CC BY-SA 3.0",
6+
"author":"Justin DuJardin",
7+
"email":"justin@dujardinconsulting.com",
8+
"url":"https://mathy.ai",
9+
"mathy_version":">=0.6.7,<1.0.0",
10+
"prediction_window_size":16,
11+
"dropout":0.2,
12+
"units":256,
13+
"embedding_units":256,
14+
"lstm_units":128,
15+
"topics":[
1616
"poly",
17+
"poly-combine",
1718
"complex",
18-
"binomial"
19+
"binomial",
20+
"poly-blockers"
1921
],
20-
"difficulty": null,
21-
"model_name": "model",
22-
"init_model_from": null,
23-
"train": false,
24-
"verbose": true,
25-
"lr": 0.001,
26-
"max_eps": 5000,
27-
"summary_interval": 100,
28-
"gamma": 0.99,
29-
"num_workers": 4,
30-
"td_lambda": 0.2,
31-
"print_training": false,
32-
"print_model_call_times": false,
33-
"print_mode": "terminal",
34-
"normalization_style": "layer",
35-
"use_term_order": false,
36-
"use_tree_complexity": false,
37-
"use_grouping_control": false,
38-
"clip_grouping_control": true,
39-
"use_env_features": true,
40-
"use_node_values": true,
41-
"update_gradients_every": 6,
42-
"num_thinking_steps_begin": 3,
43-
"mcts_sims": 10,
44-
"worker_wait": 0.01,
45-
"profile": false,
46-
"action_strategy": "a3c",
47-
"main_worker_use_epsilon": false,
48-
"e_greedy_min": 0.01,
49-
"e_greedy_max": 0.3,
50-
"entropy_loss_scaling": 0.05,
51-
"normalize_entropy_loss": true,
52-
"aux_tasks_weight_scale": 0.1,
53-
"teacher_start_evaluations_at_episode": 50,
54-
"teacher_evaluation_steps": 5,
55-
"teacher_promote_wins": 0.95,
56-
"teacher_demote_wins": 0.6
22+
"difficulty":null,
23+
"model_dir":"mathy_alpha_sm",
24+
"model_name":"model",
25+
"init_model_from":null,
26+
"train":false,
27+
"verbose":true,
28+
"lr_initial":0.01,
29+
"lr_decay_steps":100,
30+
"lr_decay_rate":0.96,
31+
"lr_decay_staircase":true,
32+
"max_eps":15000,
33+
"summary_interval":100,
34+
"gamma":0.99,
35+
"num_workers":4,
36+
"td_lambda":0.2,
37+
"print_training":false,
38+
"print_model_call_times":false,
39+
"print_mode":"terminal",
40+
"normalization_style":"layer",
41+
"use_grouping_control":false,
42+
"clip_grouping_control":true,
43+
"update_gradients_every":8,
44+
"mcts_sims":10,
45+
"worker_wait":0.01,
46+
"profile":false,
47+
"action_strategy":"a3c",
48+
"main_worker_use_epsilon":false,
49+
"e_greedy_min":0.01,
50+
"e_greedy_max":0.1,
51+
"entropy_loss_scaling":0.05,
52+
"normalize_entropy_loss":true,
53+
"normalize_pi_loss":true,
54+
"aux_tasks_weight_scale":1.0,
55+
"teacher_start_evaluations_at_episode":50,
56+
"teacher_evaluation_steps":20,
57+
"teacher_promote_wins":0.95,
58+
"teacher_demote_wins":0.5
5759
}
-2.91 MB
Binary file not shown.
-5.81 MB
Binary file not shown.

0 commit comments

Comments
 (0)