Beispiel #1 (Example 1)
def play(next_actions):
    """Play a single game to completion and return the first player's point.

    ``next_actions`` is a pair of action-selection callables: index 0 is
    consulted on the first player's turns, index 1 on the second player's.
    """
    state = State()
    while not state.is_done():
        # Pick the strategy belonging to the player whose turn it is.
        chooser = next_actions[0] if state.is_first_player() else next_actions[1]
        state = state.next_state(chooser(state))
    return first_player_point(state)
Beispiel #2 (Example 2)
def play(model):
    """Self-play one game with PV-MCTS and return its training history.

    Each history entry has the form ``[[pieces, enemy_pieces], policy, value]``.
    The value slot is left as ``None`` during play and back-filled afterwards
    from the first player's game result, with the sign alternating per ply.
    """
    history = []
    state = State()
    while not state.is_done():
        scores = pv_mcts_scores(model, state, SP_TEMPERATURE)

        # Record the position together with a full-size policy vector
        # (zeros everywhere except the legal actions' MCTS scores).
        policies = [0] * DN_OUTPUT_SIZE
        for move, prob in zip(state.legal_actions(), scores):
            policies[move] = prob
        history.append([[state.pieces, state.enemy_pieces], policies, None])

        # Sample the next move from the MCTS visit distribution.
        chosen = np.random.choice(state.legal_actions(), p=scores)
        state = state.next_state(chosen)

    # Back-fill the outcome, flipping the sign for the alternating player.
    value = first_player_value(state)
    for entry in history:
        entry[2] = value
        value = -value
    return history
Beispiel #3 (Example 3)
        # PUCT child selection (AlphaZero-style): choose the child that
        # maximizes Q + U.  NOTE(review): the enclosing `def` is above this
        # view — presumably a tree-node "select child" method; confirm.
        C_PUCT = 1.0  # exploration constant balancing Q vs. the prior term
        # Total visit count across all children (the parent's visit count).
        t = sum(nodes_to_scores(self.child_nodes))
        pucb_values = [
            # Q term: negated mean value (the child's value is stored from
            # the opponent's perspective); 0.0 for an unvisited child.
            (-child_node.w / child_node.n if child_node.n > 0 else 0.0) +
            # U term: prior policy scaled by sqrt(total visits) and damped
            # by this child's own visit count.
            C_PUCT * child_node.policy * math.sqrt(t) / (1 + child_node.n)
            for child_node in self.child_nodes
        ]
        # Return the child with the highest PUCB score.
        return self.child_nodes[np.argmax(pucb_values)]


def pv_mcts_action(model, temperature=0):
    """Build an action-selection function backed by PV-MCTS.

    The returned callable takes a state, computes the MCTS score
    distribution over its legal actions with the given model and
    temperature, and samples one legal action from it.
    """
    def _choose(state):
        probabilities = pv_mcts_scores(model, state, temperature)
        return np.random.choice(state.legal_actions(), p=probabilities)

    return _choose


if __name__ == '__main__':
    # Load the newest saved model checkpoint (lexicographically last *.h5).
    model_path = sorted(Path('./model').glob('*.h5'))[-1]
    model = tf.keras.models.load_model(str(model_path))

    # Play one game where every move is chosen by PV-MCTS (temperature 1.0),
    # printing the board after each move.
    state = State()
    next_action = pv_mcts_action(model, 1.0)
    while not state.is_done():
        state = state.next_state(next_action(state))
        print(state)