# In[ ]:
# Training loop: run EPISODES episodes against `env`, letting `QL` pick actions
# and store experience. If the env reports an invalid move, cycle through the
# remaining actions ((action + 1) % QL.n_y) until a valid one is accepted.
# NOTE(review): relies on globals EPISODES, env, QL, RENDER_ENV defined in an
# earlier cell — confirm they are in scope before running this cell.
for episode in range(EPISODES):
    observation = env.reset()
    QL.curr_episode = episode
    while True:
        if RENDER_ENV:
            env.render()
        valid_move = False
        action = None
        while not valid_move:
            # Choose an action based on observation (only on the first try;
            # retries below cycle deterministically through the action space).
            if action is None:  # fixed: was `action == None`; identity check is correct for None
                action = QL.choose_action(observation)
            observation_, reward, done, info = env.step(action)
            valid_move = info['valid']
            # Let the agent reshape the raw env reward before storing it.
            reward = QL.calculate_reward(valid_move, done, reward, observation_)
            QL.save_experience(observation=observation, action=action,
                               reward=reward, observation_=observation_,
                               is_game_over=done, is_move_valid=valid_move)
            # Try the next action in round-robin order if this one was invalid.
            action = (action + 1) % QL.n_y
        # Fixed: the original never advanced the state nor terminated the
        # step loop, so each episode spun forever acting from the reset state.
        observation = observation_
        if done:
            break
from q_state import next_state, random_state, actions
from q_learning import QLearning
from q_table import QTable

if __name__ == "__main__":
    # Train a tabular Q-learning agent: repeatedly roll out episodes from a
    # random start state until one rollout ends with reward == 1, then move on.
    episode = 100
    model_save_interval = 10

    table = QTable(actions)
    learning = QLearning(table)

    for step in range(episode):
        init_state = random_state()
        step_count = 0
        reward = 0

        # Keep restarting from the same initial state until a rollout succeeds
        # (terminal reward of 1).
        while reward != 1:
            state = init_state
            done = False
            while not done:
                step_count += 1
                action = learning.choose_action(state)
                state2, reward, done = next_state(state, action, table)
                # Update the Q-table from this transition.
                learning.learn(state, action, reward, state2, done)
                if not done:
                    state = state2

        # Progress report: start state, total steps taken, Q-table size.
        print(init_state, step_count, len(table.q_table))

        # Persist the Q-table periodically.
        if (step + 1) % model_save_interval == 0:
            table.save()