-
Notifications
You must be signed in to change notification settings - Fork 1
/
rl.sig
75 lines (60 loc) · 1.85 KB
/
rl.sig
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
(* Interface of the `rl` structure.
   Going by the section headings and types below, it exposes: a game over
   `mcts` types, players built from a tree neural network (`tnn`), search and
   training entry points, and a generation-based reinforcement-learning loop.
   NOTE(review): only names and types are visible in this file; every remark
   about meaning below is an assumption to confirm against rl.sml. *)
signature rl =
sig
(* Brings in the specifications of signature Abbrev. `term` is used below
   without being declared here, so it presumably comes from Abbrev. *)
include Abbrev
(* Short local names for types defined in other structures. *)
type seq = kernel.seq
type prog = kernel.prog
type tnn = mlTreeNeuralNetwork.tnn
type 'a set = 'a Redblackset.set
type ('a,'b) dict = ('a,'b) Redblackmap.dict
(* Game vocabulary: a move is an int, a board is a list of programs, and a
   player is an `mcts.player` over those two types. *)
type move = int
type board = prog list
type player = (board,move) mcts.player
(* globals: mutable cells (refs) that callers can read and assign.
   ncore     - presumably the number of cores/workers to use; confirm.
   ntarget   - presumably the number of targets handled per run; confirm.
   maxgen    - optional int; presumably a bound on generations, with NONE
               meaning no bound; confirm.
   in_search - boolean flag; presumably set while a search is running. *)
val ncore : int ref
val ntarget : int ref
val maxgen : int option ref
val in_search : bool ref
(* data: mutable collections.
   progd - a set of programs.
   embd  - a map from terms to real vectors (presumably cached embeddings).
   wind  - a map from int keys to programs; meaning of the key is not
           visible here. *)
val progd: prog set ref
val embd : (term, real vector) dict ref
val wind : (int, prog) dict ref
(* game: the `mcts.game` description over `board` and `move`. *)
val game : (board,move) mcts.game
(* players: each function turns a tnn into a player. `player_glob` is a ref
   holding one such function, presumably the one the search currently uses. *)
val player_uniform : tnn -> player
val player_wtnn : tnn -> player
val player_wtnn_cache : tnn -> player
val player_glob : (tnn -> player) ref
(* replaying solutions
   linearize    - maps a program to a list of (board, move) pairs; presumably
                  the successive positions and moves that rebuild it.
   apply_movel  - takes a list of moves and a board and returns a board.
   random_board, random_prog - take an int whose meaning (size? seed?) is not
                  visible here; TODO confirm. *)
val linearize : prog -> (board * move) list
val apply_movel : move list -> board -> board
val random_board : int -> board
val random_prog : int -> prog
(* search parameters: mutable settings.
   wnoise_flag, noise_flag - boolean switches; presumably enable noise.
   noise_coeff_glob        - real-valued coefficient for that noise.
   nsim_opt, time_opt      - optional int / optional real; presumably limits
                             on simulations and on time (unit not shown).
   coreid_glob             - int; presumably the id of the current core. *)
val wnoise_flag : bool ref
val noise_coeff_glob : real ref
val noise_flag : bool ref
val nsim_opt : int option ref
val time_opt : real option ref
val coreid_glob : int ref
(* train parameters
   use_mkl    - boolean switch; presumably selects an MKL-backed trainer.
   dim_glob   - int setting; presumably the embedding dimension.
   get_tnndim - returns a list pairing each term with a list of ints
                (presumably the layer dimensions for that operator). *)
val use_mkl : bool ref
val dim_glob : int ref
val get_tnndim : unit -> (term * int list) list
(* functions
   search - takes a tnn and an int and returns a list of (int, prog) pairs.
   trainf - takes a string and returns unit, so it works by side effect;
            what the string names is not visible here. *)
val search : tnn -> int -> (int * prog) list
val trainf : string -> unit
(* reinforcement learning
   expname, ngen_glob - mutable string / int settings (presumably the
                        experiment name and current generation number).
   rl_*               - each takes a string and an int and returns unit.
   parspec            - an `smlParallel.extspec` whose three type parameters
                        are the argument types and result type of `search`. *)
val expname : string ref
val ngen_glob : int ref
val rl_search_only : string -> int -> unit
val rl_train_only : string -> int -> unit
val rl_search : string -> int -> unit
val rl_train : string -> int -> unit
val parspec : (tnn, int, (int * prog) list) smlParallel.extspec
(* reading solutions: takes an int and returns a list of (int, prog) pairs,
   the same shape that `search` returns. *)
val read_isol : int -> (int * prog) list
(* interactive search: written with fully qualified names, but by the
   abbreviations above the type equals tnn -> Arbint.int list -> prog option.
   NONE presumably means no program was found for the given target. *)
val search_target : mlTreeNeuralNetwork.tnn -> Arbint.int list ->
kernel.prog option
end