Python GameWrapper.execute_move示例

编程语言: Python

命名空间/包名称: othello.players.a2c_player_1.GameWrapper

类/类型: GameWrapper

方法/功能: execute_move

hotexamples.com的示例: 5

Python GameWrapper.execute_move - 已找到5个示例。这些是从开源项目中提取的、最受好评的 othello.players.a2c_player_1.GameWrapper.execute_move 真实 Python 示例。您可以对示例进行评分，以帮助我们提高示例质量。

常用方法

显示隐藏

GameWrapper(7)

execute_move(5)

current_player(2)

reset(2)

convert_action_to_spot(1)

convert_spot_to_action(1)

示例#1

显示文件

    def test_execute_move_legal(self):
        """Check what execute_move returns for a legal move by player 1.

        The move must be reported as valid, the current player must become
        player 2, the game must not be done, the reward must be 0.01 (the
        original note describes this as "+1 new pieces"), and the returned
        observation must match the expected 64-entry board.
        """
        # Player 1 is the current player.
        wrapper = GameWrapper(1)

        # Place a piece; the original note names spot (3, 5) for this action.
        action = 8 * 3 + 5
        observation, reward, done, wrapper, is_valid = wrapper.execute_move(
            action)

        self.assertTrue(is_valid)
        self.assertEqual(wrapper.current_player, GameBoard.PLAYER_2)
        self.assertFalse(done)
        self.assertEqual(reward, 0.01)

        # Expected observation: zeros everywhere except five occupied entries.
        expected = [0.0] * 64
        for index in (8 * 3 + 3, 8 * 3 + 4, 8 * 3 + 5, 8 * 4 + 4):
            expected[index] = -1.0
        expected[8 * 4 + 3] = 1.0
        np.testing.assert_array_equal(observation, np.asarray(expected))

示例#2

显示文件

    def test_execute_move_pass(self):
        """Check what execute_move returns when the turn is passed.

        Passing must be reported as valid, the returned observation must equal
        the observation from reset() multiplied by -1, the reward must be
        -0.01, and the game must not be done.
        """
        wrapper = GameWrapper(1)
        initial_observation = wrapper.reset()

        outcome = wrapper.execute_move(wrapper.PASS_TURN_ACTION)
        observation, reward, done, wrapper, is_valid = outcome

        self.assertTrue(is_valid)
        # The observation after a pass is the sign-flipped initial observation.
        np.testing.assert_array_equal(observation, initial_observation * -1)
        self.assertEqual(reward, -0.01)
        self.assertFalse(done)

示例#3

显示文件

 def test_execute_move_illegal(self):
     """Check what execute_move returns for an illegal move.

     The move must be reported as invalid, the current player must stay the
     same, the reward must be -0.01, the game must not be done, and the
     returned observation must match the expected 64-entry board.
     """
     wrapper = GameWrapper(1)
     player_before = wrapper.current_player

     # Action 0 places at the corner, which is not a valid move.
     observation, reward, done, wrapper, is_valid = wrapper.execute_move(0)

     self.assertFalse(is_valid)
     self.assertEqual(player_before, wrapper.current_player)
     self.assertEqual(reward, -0.01)
     self.assertFalse(done)

     # Expected observation: zeros everywhere except four centre entries.
     expected = [0.0] * 64
     expected[8 * 3 + 3] = expected[8 * 4 + 4] = 1.0
     expected[8 * 3 + 4] = expected[8 * 4 + 3] = -1.0
     np.testing.assert_array_equal(observation, np.asarray(expected))

示例#4

显示文件

 def test_execute_move_tie_p2(self):
     """Check what execute_move returns when player 2's last move ends in a tie.

     The board is preset with a single empty spot (action 63) and player 2
     is made the current player. After the move the test expects:
       * the move is valid,
       * the current player is still player 2,
       * the game is done,
       * the reward is 0,
       * the observation is 32 entries of -1.0 followed by 32 of 1.0.
     """
     game_env = GameWrapper(1)
     game_env.current_player = GameBoard.PLAYER_2

     # The layout is written sign-flipped and negated cell by cell on
     # assignment, exactly as the original test did.
     flipped_layout = (
         [[-1.0] * 8 for _ in range(4)]
         + [[1.0] * 8 for _ in range(3)]
         + [[1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, 0.0]]
     )
     game_env.game_board.board = [
         [cell * -1.0 for cell in row] for row in flipped_layout
     ]

     # Place at the last empty spot; the assertions below expect a finished
     # game with reward 0 (a tie, per the test name) rather than a win.
     env_observation, reward, done, game_env, is_valid = game_env.execute_move(
         63)

     self.assertTrue(is_valid)
     self.assertEqual(game_env.current_player, GameBoard.PLAYER_2)
     self.assertTrue(done)
     self.assertEqual(reward, 0)
     np.testing.assert_array_equal(
         env_observation,
         np.asarray([-1.0] * 32 + [1.0] * 32))

示例#5

显示文件

 def test_execute_move_win(self):
     """Check what execute_move returns when the last move wins the game.

     The board is preset with a single empty spot (action 63). After the
     move the test expects:
       * the move is valid,
       * the current player is player 1,
       * the game is done,
       * the reward is 64,
       * the observation is 64 entries of 1.0.
     """
     game_env = GameWrapper(1)

     # Seven rows of 1.0, then a final row with six -1.0 cells and one empty
     # spot at the end.
     game_env.game_board.board = (
         [[1.0] * 8 for _ in range(7)]
         + [[1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, 0.0]]
     )

     # Place at the last empty spot to win.
     env_observation, reward, done, game_env, is_valid = game_env.execute_move(
         63)

     self.assertTrue(is_valid)
     self.assertEqual(game_env.current_player, GameBoard.PLAYER_1)
     self.assertTrue(done)
     self.assertEqual(reward, 64)
     np.testing.assert_array_equal(
         env_observation,
         np.asarray([1.0] * 64))