66 "author" : " Justin DuJardin" ,
77 "email" : " justin@dujardinconsulting.com" ,
88 "url" : " https://mathy.ai" ,
9- "mathy_version" : " >=0.0.0,<1.0.0 " ,
9+ "mathy_version" : " 0.3.5 " ,
1010 "units" : 512 ,
1111 "embedding_units" : 512 ,
1212 "lstm_units" : 128 ,
1313 "topics" : [
14- " poly-combine "
14+ " poly"
1515 ],
16- "difficulty" : null ,
17- "model_dir" : " /var/folders/q3/j42n3r692gb2yl9cp1ncs3q00000gn/T/tmpa8tndnqz " ,
16+ "difficulty" : " easy " ,
17+ "model_dir" : " ./training/alpha_piv_new " ,
1818 "model_name" : " model" ,
1919 "init_model_from" : null ,
2020 "train" : false ,
2121 "verbose" : false ,
2222 "lr" : 0.0003 ,
23- "max_eps" : 1 ,
23+ "max_eps" : 15000 ,
2424 "summary_interval" : 100 ,
2525 "gamma" : 0.99 ,
26- "num_workers" : 1 ,
26+ "num_workers" : 4 ,
2727 "td_lambda" : 0.2 ,
2828 "print_training" : false ,
2929 "print_mode" : " terminal" ,
3030 "use_term_order" : false ,
3131 "use_tree_complexity" : false ,
3232 "use_grouping_control" : true ,
33- "clip_grouping_control" : false ,
33+ "clip_grouping_control" : true ,
3434 "use_env_features" : false ,
3535 "use_node_values" : true ,
3636 "update_gradients_every" : 64 ,
3737 "num_thinking_steps_begin" : 3 ,
38- "mcts_sims" : 200 ,
39- "worker_wait" : 0.01 ,
38+ "mcts_sims" : 10 ,
39+ "worker_wait" : 0.1 ,
4040 "profile" : false ,
4141 "action_strategy" : " a3c" ,
4242 "main_worker_use_epsilon" : false ,
4343 "e_greedy_min" : 0.01 ,
4444 "e_greedy_max" : 0.1 ,
45- "entropy_loss_scaling" : 1 ,
45+ "entropy_loss_scaling" : 0.05 ,
4646 "normalize_entropy_loss" : true ,
47- "aux_tasks_weight_scale" : 1 ,
47+ "aux_tasks_weight_scale" : 0.1 ,
4848 "teacher_start_evaluations_at_episode" : 50 ,
4949 "teacher_evaluation_steps" : 20 ,
5050 "teacher_promote_wins" : 0.95 ,
5151 "teacher_demote_wins" : 0.6
52- }
52+ }
0 commit comments