Python State.terminal Beispiele

Programmiersprache: Python

Namespace / Paketname: game

Klasse / Typ: State

Methode / Funktion: terminal

Beispiele auf hotexamples.com: 3

Python State.terminal – 3 Beispiele gefunden. Dies sind die am besten bewerteten Python-Beispiele für die Methode game.State.terminal, die aus Open-Source-Projekten extrahiert wurden. Sie können die Beispiele bewerten, um uns dabei zu helfen, ihre Qualität zu verbessern.

Häufig verwendete Methoden

Anzeigen Verbergen

State(30)

is_done(30)

next(30)

legal_actions(24)

is_first_player(20)

is_lose(14)

position_to_action(4)

next_state(3)

get_state(3)

pieces_array(3)

get_available_actions(3)

terminal(3)

tick_time(3)

total_time(3)

opponent(2)

put_obstacles(2)

update(2)

make_move(2)

whiteDisplay(2)

generateActionFromString(2)

blackDisplay(2)

get_state_result(2)

get_next_state(2)

gameOver(2)

leader(1)

board(1)

copy(1)

step(1)

sid(1)

show_board(1)

get_cell(1)

put_center(1)

apply_moves(1)

players(1)

player_name(1)

play_move(1)

get_legal_moves(1)

piece_count(1)

initialise(1)

is_player_won(1)

legal_move(1)

Beispiel #1

Datei anzeigen

Datei: q2.py Projekt: axelahmer/easy21

def sarsa(lamb: int, num_episodes: int, Qstar, record=False):
    """Run a tabular Sarsa-style update with eligibility traces.

    Every episode starts from ``State(deal=True)`` and is played with
    actions chosen by ``get_e_greedy_action`` until ``terminal()`` reports
    the end.  After each step the temporal-difference error (no discount
    factor is applied) is pushed into every ``((dealer, player), action)``
    entry of the value map, weighted by that entry's trace, and each trace
    is then scaled by ``lamb``.

    Args:
        lamb: Factor each eligibility trace is multiplied by after every
            step.  NOTE(review): annotated ``int`` but only ever used as a
            multiplier -- presumably a float in [0, 1]; confirm with callers.
        num_episodes: Number of episodes to run.
        Qstar: Reference values passed unchanged to ``calc_mse``.
        record: When truthy, ``calc_mse(Q, Qstar)`` is appended to the
            returned list after each episode.

    Returns:
        A ``(Q, mses)`` tuple: the updated value map and the list of
        recorded errors (empty unless ``record`` is truthy).
    """
    q_values = state_action_map(plus=True)
    pair_visits = state_action_map()
    state_visits = state_map(plus=True)
    mses = []

    for _ in range(num_episodes):
        # Traces start fresh for every episode.
        traces = state_action_map()
        state = State(deal=True)
        action = get_e_greedy_action(q_values, state_visits, state)

        while not state.terminal():
            visited = state.get_state()
            state_visits[visited] += 1
            pair_visits[visited, action] += 1

            next_state, reward = step(state, action)
            next_action = get_e_greedy_action(q_values, state_visits,
                                              next_state)

            successor = (next_state.get_state(), next_action)
            # Read the state key again after step(): whether step() modifies
            # `state` in place is not visible here, so the pre-step key is
            # deliberately not reused.
            current = (state.get_state(), action)
            td_error = reward + q_values[successor] - q_values[current]
            traces[current] += 1

            # Sweep the whole table, not just the visited pair.
            every_entry = (
                ((dealer, player), move)
                for dealer in DEALER_RANGE
                for player in PLAYER_RANGE
                for move in ACTIONS
            )
            for entry in every_entry:
                # Per-entry step size; the 1e-9 presumably guards against a
                # zero visit count in the denominator.
                step_size = 1 / (pair_visits[entry] + 1e-9)
                q_values[entry] += step_size * td_error * traces[entry]
                traces[entry] *= lamb

            state, action = next_state, next_action

        if record:
            mses.append(calc_mse(q_values, Qstar))

    return q_values, mses

Beispiel #2

Datei anzeigen

Datei: utils.py Projekt: axelahmer/easy21

def sample_episode(pi):
    """Play one episode following ``pi`` and return its trace and reward.

    Args:
        pi: Mapping indexed by the value of ``State.get_state()`` that
            yields the action to take in that state.

    Returns:
        A ``(history, r)`` tuple.  ``history`` is a list of
        ``[state_key, action]`` pairs in visiting order; ``r`` is the reward
        returned by the last ``step`` call.

    NOTE(review): ``r`` is only bound inside the loop, so an episode whose
    initial state is already terminal raises ``UnboundLocalError`` on
    return -- confirm that ``State(deal=True)`` can never be terminal.
    """
    state = State(deal=True)
    trajectory = []

    while not state.terminal():
        key = state.get_state()
        action = pi[key]
        # Only the final reward is kept: intermediate rewards are not stored
        # because a reward is only handed out on entering the terminal state.
        trajectory.append([key, action])
        state, r = step(state, action)

    return trajectory, r

Beispiel #3

Datei anzeigen

def sarsa(lamb: int, num_episodes: int, Qstar, record=False):
    """Run a Sarsa-style update with eligibility traces on a weight vector.

    Action values are obtained through ``q_hat(state, action, w)`` with a
    36-element weight vector and the feature vector ``phi(state, action)``.
    Every episode starts from ``State(deal=True)`` and is played with
    actions from ``get_e_greedy_action`` until ``terminal()`` reports the
    end.  No discount factor is applied to the successor value.

    Args:
        lamb: Factor the trace vector is multiplied by before the current
            features are added.  NOTE(review): annotated ``int`` but only
            used as a multiplier -- presumably a float in [0, 1]; confirm.
        num_episodes: Number of episodes to run.
        Qstar: Reference values passed unchanged to ``calc_mse_linear``.
        record: When truthy, ``calc_mse_linear(w, Qstar)`` is appended to
            the returned list after each episode.

    Returns:
        A ``(w, mses)`` tuple: the weight vector and the list of recorded
        errors (empty unless ``record`` is truthy).
    """
    step_size = ALPHA
    # Weights start at zero; a uniform random start in [-1, 1] was tried
    # as an alternative in an earlier revision.
    weights = np.zeros(36)
    mses = []

    for _ in range(num_episodes):
        # Traces start fresh for every episode.
        trace = np.zeros(36)
        state = State(deal=True)
        action = get_e_greedy_action(state, weights)

        while not state.terminal():
            # Features are taken before step() is called on the state.
            features = phi(state, action)
            next_state, reward = step(state, action)
            next_action = get_e_greedy_action(next_state, weights)

            td_error = (reward
                        + q_hat(next_state, next_action, weights)
                        - q_hat(state, action, weights))
            trace = trace * lamb + features
            # In-place update so the same array object is kept throughout.
            weights += trace * (step_size * td_error)

            state, action = next_state, next_action

        if record:
            mses.append(calc_mse_linear(weights, Qstar))

    return weights, mses