Python TicTacToe.get_initial_state 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: games.tictactoe

클래스/타입: TicTacToe

메소드/함수: get_initial_state

hotexamples.com에서의 예제들: 2

Python TicTacToe.get_initial_state - 2개의 예제가 발견되었습니다. 다음은 오픈소스 프로젝트에서 추출한, Python의 games.tictactoe.TicTacToe.get_initial_state를 사용하는 실제 예제 중 평가가 가장 높은 예제들입니다. 예제를 평가해 주시면 예제의 품질을 높이는 데 도움이 됩니다.

자주 사용되는 메소드들

보기 숨기기

TicTacToe(13)

count_lines(3)

get_initial_state(2)

available_moves(1)

check_move_validity(1)

get_possible_next_steps(1)

get_state(1)

make_move(1)

print_board(1)

print_brd(1)

print_grid(1)

print_move_grid(1)

take_action(1)

update(1)

winner(1)

예제 #1

파일 보기

    def test_priornet_tictactoe_self_play(self):
        """Check the records produced by one self-play game of TicTacToe.

        A Trainer is built around a PriorNet-backed NeuralNetwork and asked
        for a single self-play game at temperature 0. The returned table is
        then checked row by row:

        * column 0 must equal the board state reached so far,
        * column 1 must equal the expected per-move vector (presumably the
          policy over the remaining legal moves -- its length shrinks by one
          every turn; confirm against Trainer.self_play),
        * the last column must alternate 1 / -1 over the seven rows.
        """
        game = TicTacToe()
        network = NeuralNetwork(game, PriorNet)
        trainer = Trainer(
            game,
            network,
            num_simulations=2,
            num_games=1,
            num_updates=0,
            buffer_size_limit=None,
            cpuct=1,
            num_threads=4,
        )
        records = trainer.self_play(temperature=0)

        # Last column: alternating sign across the seven recorded positions.
        np.testing.assert_equal(
            records[:, -1], np.array([1, -1, 1, -1, 1, -1, 1])
        )

        # Row 0 is the empty board; the expected vector has nine entries.
        state = game.get_initial_state()
        np.testing.assert_equal(records[0, 0], state)
        np.testing.assert_equal(
            records[0, 1], np.array([0, 1, 0, 0, 0, 0, 0, 0, 0])
        )

        # One-hot 3x3 action masks, in the order the game is expected to play.
        expected_actions = [
            np.array([[0, 1, 0], [0, 0, 0], [0, 0, 0]]),  # Top-middle X
            np.array([[1, 0, 0], [0, 0, 0], [0, 0, 0]]),  # Top-left O
            np.array([[0, 0, 1], [0, 0, 0], [0, 0, 0]]),  # Top-right X
            np.array([[0, 0, 0], [1, 0, 0], [0, 0, 0]]),  # Mid-left O
            np.array([[0, 0, 0], [0, 1, 0], [0, 0, 0]]),  # Mid-mid X
            np.array([[0, 0, 0], [0, 0, 1], [0, 0, 0]]),  # Mid-right O
        ]
        for row, action in enumerate(expected_actions, start=1):
            state = game.take_action(state, action)
            np.testing.assert_equal(records[row, 0], state)
            # After `row` moves the expected vector is [1, 0, ..., 0] with
            # 9 - row entries (8 entries at row 1 down to 3 at row 6).
            np.testing.assert_equal(
                records[row, 1], np.array([1] + [0] * (8 - row))
            )

예제 #2

파일 보기

 def test_policy_iteration(self):
     """Check that policy iteration over 100 games records 100 initial states.

     Runs Trainer.policy_iteration() with num_games=100, then counts how many
     entries in column 0 of the trainer's training_data equal the TicTacToe
     initial state (after casting each entry to float32).
     """
     game = TicTacToe()
     network = NeuralNetwork(game, PriorNet)
     trainer = Trainer(
         game,
         network,
         num_simulations=2,
         num_games=100,
         num_updates=0,
         buffer_size_limit=None,
         cpuct=1,
         num_threads=4,
     )
     trainer.policy_iteration()

     recorded_states = trainer.training_data[:, 0]
     # Count the recorded states that match the initial board element-wise.
     initial_count = sum(
         1
         for state in recorded_states
         if (state.astype(np.float32) == game.get_initial_state()).all()
     )
     self.assertEqual(initial_count, 100)