In [1]:
import torch
from torch.distributions.dirichlet import Dirichlet

In [2]:
from hexconvolution import NoMCTSModel
from hexboard import Board
from hexgame import HexGame

In [3]:
# Run on the GPU when PyTorch can see a CUDA device, otherwise on the CPU.
if torch.cuda.is_available():
    device = torch.device("cuda")
else:
    device = torch.device("cpu")

In [4]:
# Self-play configuration, gathered in one place so the values stay in sync.
BOARD_SIZE = 11          # side length; must match the Board(size=...) used for the game
MODEL_LAYERS = 5         # `layers` argument passed to NoMCTSModel
DIRICHLET_ALPHA = 0.03   # concentration used for every component of the noise distribution
SEED = 0

# Seed torch's global RNG before anything random is created (model weights,
# noise samples) so that Restart & Run All yields the same results.
# NOTE(review): if hexgame draws from numpy / `random` as well, those need
# their own seed -- confirm against the hexgame module.
torch.manual_seed(SEED)

# One Dirichlet component per board cell (BOARD_SIZE * BOARD_SIZE = 121 for 11x11),
# derived from BOARD_SIZE instead of being hard-coded.
noise = Dirichlet(torch.full((BOARD_SIZE * BOARD_SIZE,), DIRICHLET_ALPHA))
model = NoMCTSModel(board_size=BOARD_SIZE, layers=MODEL_LAYERS)

In [5]:
# Create an 11x11 board; its repr in the next cell shows an all-zero grid.
board = Board(size=11)

In [6]:
# Display the board's repr: the cell grid followed by the set of legal moves.
board

Board
[[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.]
 [0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.]
 [0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.]
 [0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.]
 [0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.]
 [0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.]
 [0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.]
 [0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.]
 [0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.]
 [0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.]
 [0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.]]
Legal moves
{(7, 3), (6, 9), (0, 7), (1, 6), (0, 10), (3, 7), (2, 5), (8, 5), (5, 8), (4, 0), (10, 8), (9, 0), (6, 7), (5, 5), (10, 7), (7, 6), (6, 10), (0, 4), (1, 1), (4, 10), (3, 2), (2, 6), (8, 2), (4, 5), (9, 3), (6, 0), (7, 5), (0, 1), (3, 1), (9, 9), (7, 8), (2, 1), (8, 9), (9, 4), (5, 1), (10, 3), (7, 2), (1, 5), (3, 6), (2, 2), (1, 10), (8, 6), (4, 1), (10, 9), (9, 7), (6, 4), (5, 4), (10, 4), (7, 1), (0, 5), (1, 0), (0, 8), (3, 5), (2, 7), (8, 3), (5, 10), (4, 6), (10, 10), (9, 2), (6, 1), (5, 7), (7, 4), (0, 2), (1, 3), (4, 8), (3, 0), (2, 8), (9, 8), (8, 0), (6, 2), (3, 10), (8,

In [7]:
# Wire the board, the network, the compute device and the Dirichlet noise
# source into a single game object.
# NOTE(review): noise_level and temperature are interpreted inside
# hexgame.HexGame -- their exact meaning is not visible from this notebook.
hexgame = HexGame(
    board,
    model,
    device,
    noise,
    noise_level=0.25,
    temperature=0.1,
)

In [8]:
# Let the game play itself; play_moves() returns three values, unpacked here
# as the board states, the moves and the targets.
# NOTE(review): if HexGame plays on the `board` object in place, re-running
# this cell needs a freshly created `board` first -- confirm in hexgame.
board_states, moves, targets = hexgame.play_moves()

In [9]:
# Display the game's repr after play: the grid (entries 1, -1 and 0)
# followed by the legal and illegal move sets.
hexgame

Board
[[-1.  1.  1. -1.  1.  1. -1. -1.  1. -1.  1.]
 [ 1.  1. -1. -1. -1.  1.  1. -1.  1.  1. -1.]
 [ 1. -1. -1. -1. -1. -1. -1. -1. -1.  0.  1.]
 [ 1.  0. -1.  1.  1.  1. -1. -1. -1. -1.  1.]
 [ 1.  1. -1.  1.  1. -1.  1. -1.  1. -1. -1.]
 [-1. -1.  1.  1. -1.  1. -1.  1.  1.  1. -1.]
 [ 1.  1. -1.  1. -1.  1. -1.  1. -1.  1.  1.]
 [-1. -1. -1.  1.  1.  1. -1.  1. -1. -1.  1.]
 [-1. -1.  1.  1.  1. -1.  1. -1.  1.  1.  1.]
 [ 1. -1.  1.  0. -1.  1. -1. -1. -1. -1.  1.]
 [ 1.  1. -1. -1.  1. -1.  1. -1.  1. -1. -1.]]
Legal moves
{(9, 3), (3, 1), (2, 9)}
Illegal moves
{(7, 3), (6, 9), (0, 7), (1, 6), (0, 10), (3, 7), (2, 5), (8, 5), (5, 8), (4, 0), (10, 8), (9, 0), (6, 7), (5, 5), (10, 7), (7, 6), (6, 10), (0, 4), (1, 1), (4, 10), (3, 2), (2, 6), (8, 2), (4, 5), (6, 0), (7, 5), (0, 1), (9, 9), (7, 8), (2, 1), (8, 9), (9, 4), (5, 1), (10, 3), (7, 2), (1, 5), (3, 6), (2, 2), (1, 10), (8, 6), (4, 1), (10, 9), (9, 7), (6, 4), (5, 4), (10, 4), (7, 1), (0, 5), (1, 0), (0, 8), (3, 5), (2, 7),

In [10]:
# Display the tensor form of the game's board. In the output below, the first
# plane has 1 where the grid shows 1 and the second plane has 1 where the grid
# shows -1.
hexgame.board.board_tensor

tensor([[[0., 1., 1., 0., 1., 1., 0., 0., 1., 0., 1.],
         [1., 1., 0., 0., 0., 1., 1., 0., 1., 1., 0.],
         [1., 0., 0., 0., 0., 0., 0., 0., 0., 0., 1.],
         [1., 0., 0., 1., 1., 1., 0., 0., 0., 0., 1.],
         [1., 1., 0., 1., 1., 0., 1., 0., 1., 0., 0.],
         [0., 0., 1., 1., 0., 1., 0., 1., 1., 1., 0.],
         [1., 1., 0., 1., 0., 1., 0., 1., 0., 1., 1.],
         [0., 0., 0., 1., 1., 1., 0., 1., 0., 0., 1.],
         [0., 0., 1., 1., 1., 0., 1., 0., 1., 1., 1.],
         [1., 0., 1., 0., 0., 1., 0., 0., 0., 0., 1.],
         [1., 1., 0., 0., 1., 0., 1., 0., 1., 0., 0.]],

        [[1., 0., 0., 1., 0., 0., 1., 1., 0., 1., 0.],
         [0., 0., 1., 1., 1., 0., 0., 1., 0., 0., 1.],
         [0., 1., 1., 1., 1., 1., 1., 1., 1., 0., 0.],
         [0., 0., 1., 0., 0., 0., 1., 1., 1., 1., 0.],
         [0., 0., 1., 0., 0., 1., 0., 1., 0., 1., 1.],
         [1., 1., 0., 0., 1., 0., 1., 0., 0., 0., 1.],
         [0., 0., 1., 0., 1., 0., 1., 0., 1., 0., 0.],
        