Python StateManager.is_legal Examples

Programming Language: Python

Namespace/Package Name: state_manager

Class/Type: StateManager

Method/Function: is_legal

Examples at hotexamples.com: 2

Python StateManager.is_legal - 2 examples found. These are the top-rated real-world Python examples of state_manager.StateManager.is_legal, extracted from open source projects. You can rate examples to help us improve their quality.

Frequently Used Methods

Show Hide

StateManager(30)

calculate_next_state(9)

is_finished(4)

add_state(3)

increment_state(3)

get_winner(3)

make_move(3)

push(2)

read(2)

is_legal(2)

load(2)

get_moves(2)

get_legal_moves(2)

get_latest_state(2)

move(2)

player1_won(2)

player2_won(2)

print_board(2)

is_game_over(2)

process_request(2)

convert_to_move(2)

close_db(2)

create_game(2)

redo(1)

setReadyVersion(1)

setVersionStateOnDisk(1)

is_optimal(1)

jsonify(1)

setSubPkgsToRemoveOnRemoval(1)

load_gpi_state(1)

lookup(1)

setRpmsToRemoveOnRemoval(1)

setPilotName(1)

receive_state(1)

setFile(1)

new_state(1)

play_game(1)

save_last_exit(1)

run_for_unittest(1)

run(1)

print_state(1)

probe(1)

set_latest(1)

removeVersion(1)

reimage(1)

start(1)

indexing_constraints(1)

is_last_exit_from_reload(1)

draw_state(1)

getActiveVersion(1)

Example #1

Show file

File: neural_actor.py Project: Henkeboi/Deep-reinforcement-learning-multiplex-hexadiagonal-monte-carlo-tree-search

def _random_legal_move_index(state_manager, board_size):
    """Return a uniformly drawn cell index that is legal in the current state.

    Indices are drawn from ``range(board_size ** 2)`` and rejected until
    ``StateManager.is_legal`` accepts one for the manager's current string
    representation.
    """
    # The state does not change while sampling, so serialize it only once.
    state_str = state_manager.string_representation()
    move_index = random.randrange(0, board_size ** 2)
    while not StateManager.is_legal(move_index, state_str):
        move_index = random.randrange(0, board_size ** 2)
    return move_index


def main():
    """Train or load the neural actors, then pit a random player against one.

    With ``train`` enabled, ``player1`` is trained for 100 MCT games and its
    model is stored under ``data/16.3``; otherwise both players load that
    model. Afterwards 1000 games are played in which the side to move when
    ``player1_to_move`` is set plays random legal moves and the other side
    plays ``player2``'s network move. The win counts are printed at the end.
    """
    board_size = 4
    max_num_moves = int(board_size ** 2)
    conv_layers = []
    # Used only as the first entry of hidden_layers below.
    state_space_size = 128
    hidden_layers = [state_space_size, max_num_moves]
    la = 0.01

    state_manager = StateManager(board_size)
    num_simulations = 200

    player1 = NeuralActor(conv_layers, hidden_layers, max_num_moves, la, 'sgd')
    player2 = NeuralActor(conv_layers, hidden_layers, max_num_moves, la, 'sgd')
    mct1 = MCT(player1, num_simulations)
    # NOTE(review): mct2 is never used in this function; kept in case the MCT
    # constructor has side effects that are not visible here.
    mct2 = MCT(player2, num_simulations)

    train = False
    if train:
        # NOTE(review): only player1 is trained and stored in this branch;
        # player2 keeps whatever weights its constructor gave it.
        for i in range(0, 100):
            mct1.play_game(copy.deepcopy(state_manager))
            training_data = mct1.get_training_data()
            loss = player1.update_Q(training_data)
            print(str(i) + " " + str(loss))
        player1.store_model('data/16.3')
    else:
        player1.load_model('data/16.3')
        player2.load_model('data/16.3')

    win1 = 0
    win2 = 0
    for _ in range(0, 1000):
        state_manager = StateManager(board_size)
        while not state_manager.player1_won() and not state_manager.player2_won():
            if state_manager.player1_to_move:
                # Player 1 is the random baseline.
                move_index = _random_legal_move_index(state_manager, board_size)
            else:
                # Player 2 follows the network's choice for the current state.
                move_index = player2.get_action(state_manager.string_representation())
            state_manager.make_move(state_manager.convert_to_move(move_index))
        if state_manager.player1_won():
            win1 += 1
        elif state_manager.player2_won():
            win2 += 1
        else:
            print("No winner")
    print(f"Times player 1 won: {win1}. Times player2 won: {win2}")

Example #2

Show file

File: neural_actor.py Project: Henkeboi/Deep-reinforcement-learning-multiplex-hexadiagonal-monte-carlo-tree-search

 def get_action(self, state_str):
     """Return the index of the highest-scoring legal move for ``state_str``.

     The state string is decoded character by character into numbers
     (character code minus 48) and fed through ``self.nn``. Candidate moves
     are then tried in order of decreasing network score until
     ``StateManager.is_legal`` accepts one.

     Args:
         state_str: String representation of the game state; assumed to
             consist of ASCII digit characters (TODO confirm against
             ``StateManager.string_representation``).

     Returns:
         The chosen move index as a plain ``int``, indexing the flattened
         network output.

     Raises:
         ValueError: If no index of the network output is a legal move.
     """
     # np.fromstring's binary mode is deprecated; frombuffer on the encoded
     # bytes yields the same per-character codes. Subtracting 48 ('0') maps
     # digit characters to their numeric value and returns a writable copy.
     state = np.frombuffer(state_str.encode("ascii"), dtype=np.int8) - 48
     state = torch.from_numpy(state).float()
     nn_output = self.nn(state)  # Forward pass

     # Work on a flattened, detached copy: torch.argmax without `dim` already
     # returns a flattened index, so this handles both (N,) and (1, N) outputs
     # and leaves the network output itself untouched.
     scores = nn_output.detach().clone().flatten()
     for _ in range(scores.numel()):
         move_index = int(torch.argmax(scores).item())
         if StateManager.is_legal(move_index, state_str):
             return move_index
         # -inf (rather than a finite sentinel) guarantees a rejected move can
         # never be selected again, whatever the range of the scores.
         scores[move_index] = float("-inf")
     raise ValueError("no legal move available for state " + repr(state_str))