diff --git a/README.md b/README.md index 943e08d..d0bd5e7 100644 --- a/README.md +++ b/README.md @@ -13,8 +13,10 @@ pip install -e . ### Coding example ```python import gym +import gym_go -go_env = gym.make('gym_go:go-v0', size=7, komi=0, reward_method='real') +go_env = gym.make('go-v0', size=7, komi=0, reward_method='real') +go_env.reset() first_action = (2,5) second_action = (5,2) diff --git a/demo.py b/demo.py index 9c9d2d5..7d6a05f 100644 --- a/demo.py +++ b/demo.py @@ -1,6 +1,7 @@ import argparse import gym +import gym_go # Arguments parser = argparse.ArgumentParser(description='Demo Go Environment') @@ -9,7 +10,8 @@ args = parser.parse_args() # Initialize environment -go_env = gym.make('gym_go:go-v0', size=args.boardsize, komi=args.komi) +go_env = gym.make('go-v0', size=args.boardsize, komi=args.komi) +go_env.reset() # Game loop done = False diff --git a/gym_go/tests/efficiency.py b/gym_go/tests/efficiency.py index 7b179b7..392ca11 100644 --- a/gym_go/tests/efficiency.py +++ b/gym_go/tests/efficiency.py @@ -2,6 +2,7 @@ import unittest import gym +import gym_go import numpy as np from tqdm import tqdm @@ -11,7 +12,7 @@ class Efficiency(unittest.TestCase): iterations = 64 def setUp(self) -> None: - self.env = gym.make('gym_go:go-v0', size=self.boardsize, reward_method='real') + self.env = gym.make('go-v0', size=self.boardsize, reward_method='real') def testOrderedTrajs(self): durs = [] diff --git a/gym_go/tests/test_basics.py b/gym_go/tests/test_basics.py index 307ed1f..e015460 100644 --- a/gym_go/tests/test_basics.py +++ b/gym_go/tests/test_basics.py @@ -10,13 +10,13 @@ class TestGoEnvBasics(unittest.TestCase): def __init__(self, *args, **kwargs): super().__init__(*args, **kwargs) - self.env = gym.make('gym_go:go-v0', size=7, reward_method='real') + self.env = gym.make('go-v0', size=7, reward_method='real') def setUp(self): self.env.reset() def test_state(self): - env = gym.make('gym_go:go-v0', size=7) + env = gym.make('go-v0', size=7) state = env.reset() self.assertIsInstance(state, np.ndarray) self.assertEqual(state.shape[0], govars.NUM_CHNLS) @@ -27,7 +27,7 @@ def test_board_sizes(self): expected_sizes = [7, 13, 19] for expec_size in expected_sizes: - env = gym.make('gym_go:go-v0', size=expec_size) + env = gym.make('go-v0', size=expec_size) state = env.reset() self.assertEqual(state.shape[1], expec_size) self.assertEqual(state.shape[2], expec_size) @@ -150,7 +150,7 @@ def test_game_does_not_end_with_disjoint_passes(self): self.assertFalse(done) def test_num_liberties(self): - env = gym.make('gym_go:go-v0', size=7) + env = gym.make('go-v0', size=7) steps = [(0, 0), (0, 1)] libs = [(2, 0), (1, 2)] @@ -173,7 +173,8 @@ def test_num_liberties(self): self.assertEqual(whitelibs, libs[1], state) def test_komi(self): - env = gym.make('gym_go:go-v0', size=7, komi=2.5, reward_method='real') + env = gym.make('go-v0', size=7, komi=2.5, reward_method='real') + env.reset() # White win _ = env.step(None) @@ -223,7 +224,8 @@ def test_children(self): self.assertTrue((children[a] == 0).all()) def test_real_reward(self): - env = gym.make('gym_go:go-v0', size=7, reward_method='real') + env = gym.make('go-v0', size=7, reward_method='real') + env.reset() # In game state, reward, done, info = env.step((0, 0)) @@ -258,7 +260,8 @@ def test_real_reward(self): env.close() def test_heuristic_reward(self): - env = gym.make('gym_go:go-v0', size=7, reward_method='heuristic') + env = gym.make('go-v0', size=7, reward_method='heuristic') + env.reset() # In game state, reward, done, info = env.step((0, 0)) diff --git a/gym_go/tests/test_invalid_moves.py b/gym_go/tests/test_invalid_moves.py index 3693bbe..2bb85ca 100644 --- a/gym_go/tests/test_invalid_moves.py +++ b/gym_go/tests/test_invalid_moves.py @@ -11,7 +11,7 @@ class TestGoEnvInvalidMoves(unittest.TestCase): def __init__(self, *args, **kwargs): super().__init__(*args, **kwargs) - self.env = gym.make('gym_go:go-v0', size=7, reward_method='real') + self.env = gym.make('go-v0', size=7, reward_method='real') def setUp(self): self.env.reset() @@ -185,7 +185,8 @@ def test_small_suicide(self): :return: """ - self.env = gym.make('gym_go:go-v0', size=3, reward_method='real') + self.env = gym.make('go-v0', size=3, reward_method='real') + self.env.reset() for move in [6, 7, 8, 5, 4, 8, 0, 1]: state, reward, done, info = self.env.step(move) @@ -202,7 +203,8 @@ def test_invalid_after_capture(self): :return: """ - self.env = gym.make('gym_go:go-v0', size=3, reward_method='real') + self.env = gym.make('go-v0', size=3, reward_method='real') + self.env.reset() for move in [0, 8, 6, 4, 1, 2, 3, 7]: state, reward, done, info = self.env.step(move) diff --git a/gym_go/tests/test_valid_moves.py b/gym_go/tests/test_valid_moves.py index 0e54064..a3806b5 100644 --- a/gym_go/tests/test_valid_moves.py +++ b/gym_go/tests/test_valid_moves.py @@ -10,7 +10,7 @@ class TestGoEnvValidMoves(unittest.TestCase): def __init__(self, *args, **kwargs): super().__init__(*args, **kwargs) - self.env = gym.make('gym_go:go-v0', size=7, reward_method='real') + self.env = gym.make('go-v0', size=7, reward_method='real') def setUp(self): self.env.reset() diff --git a/setup.py b/setup.py index d33850a..c86abb7 100644 --- a/setup.py +++ b/setup.py @@ -3,5 +3,5 @@ setup( name='gym_go', version='0.0.1', - install_requires=['gym'] # and other dependencies + install_requires=['gym==0.23.1'] # and other dependencies )