Example 1
def main():
    # --------------preparation--------------------
    rst_path, sim_path = generatePath(current_time)  # Create a new folder for the experiment
    RL = QLearningTable(list(range(len(green_states))))  # Initialize the Q-learning framework
    feed_path = '{}/results/{}/qtable.csv'.format(WORKSPACE, 'p5i3g0')
    RL.feedQTable(feed_path)  # Helpful when inheriting from a previously trained agent
    # ---------------training--------------------
    trainAgent(RL, rst_path, sim_path)
    # --------------testing--------------------
    RL.epsilon = 1  # Epsilon-greedy no longer selects random actions
    fixed = testAgent('fixed', RL)
    rl = testAgent('rl', RL)
    actuated = testAgent('actuated', RL)
    plotTestResult(rl, fixed, actuated, sim_path)
    flow_scenarios = ['-50%', '-25%', '0%', '+25%', '+50%']
    pushAgent(flow_scenarios, sim_path, RL)  # Explore the limits of the trained agent
    # --------------results----------------------
    RL.saveQTable('{}/qtable.csv'.format(sim_path))
    RL.plotCumulativeReward(sim_path)  # Plot the cumulative reward
    RL_params = {
        'lr': RL.alpha,
        'gamma': RL.gamma,
        'e_max': RL.e_greedy_max,
        'e_inc': RL.e_greedy_increment
    }
    writeLog(RL_params, rst_path, sim_path, clean=True)  # Record basic information about the experiment
    # --------------end--------------------
    print('\nALL DONE, check {}'.format(str(current_time)))
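The examples assume a QLearningTable class (imported from RL_brain) that exposes feedQTable, saveQTable, chooseAction, an epsilon attribute, and the alpha/gamma/e_greedy_* hyperparameters read into RL_params above. The snippet below is only a minimal sketch of what such a tabular Q-learning class could look like, reconstructed from how it is used here; the pandas-based layout, the learn method, and the meaning of epsilon as "probability of acting greedily" are assumptions, not the actual RL_brain implementation (plotting helpers such as plotCumulativeReward are omitted).

import numpy as np
import pandas as pd


class QLearningTable:
    """Minimal sketch of the interface used above; not the real RL_brain class."""

    def __init__(self, actions, alpha=0.01, gamma=0.9,
                 e_greedy_max=0.9, e_greedy_increment=0.001):
        self.actions = actions                    # list of action indices
        self.alpha, self.gamma = alpha, gamma
        self.e_greedy_max = e_greedy_max
        self.e_greedy_increment = e_greedy_increment
        self.epsilon = 0                          # probability of greedy action; 1 = pure exploitation
        self.q_table = pd.DataFrame(columns=actions, dtype=np.float64)

    def _ensure_state(self, s):
        # Lazily add unseen states with zero-initialized action values
        if s not in self.q_table.index:
            self.q_table.loc[s] = [0.0] * len(self.actions)

    def chooseAction(self, s, o=None):
        # o is the extra context argument seen in Example 3; unused in this sketch
        self._ensure_state(s)
        if np.random.uniform() < self.epsilon:    # exploit: pick a greedy action
            row = self.q_table.loc[s]
            return np.random.choice(row[row == row.max()].index)
        return np.random.choice(self.actions)     # explore: pick a random action

    def learn(self, s, a, r, s_):
        # Standard one-step Q-learning update
        self._ensure_state(s)
        self._ensure_state(s_)
        q_predict = self.q_table.loc[s, a]
        q_target = r + self.gamma * self.q_table.loc[s_].max()
        self.q_table.loc[s, a] += self.alpha * (q_target - q_predict)

    def feedQTable(self, path):
        self.q_table = pd.read_csv(path, index_col=0)
        self.q_table.columns = self.q_table.columns.astype(int)

    def saveQTable(self, path):
        self.q_table.to_csv(path)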
Example 2
def main():
    trained_number = getLastExperiment('p5i3g0')
    RL = QLearningTable(list(range(len(green_states))))
    trained_path = '{}/results/{}/'.format(WORKSPACE, trained_number)
    qtable_path = trained_path + 'qtable.csv'
    RL.feedQTable(qtable_path)
    RL.epsilon = 1
    fixed = testAgent('fixed', RL)
    rl = testAgent('rl', RL)
    actuated = testAgent('actuated', RL)
    plotTestResult(rl, fixed, actuated, trained_path)
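getLastExperiment is not shown in these examples. Below is only a plausible minimal version, assuming experiment folders live under WORKSPACE/results/ and sort chronologically by name; how the real helper interprets its argument is unknown, so here it is treated as a name prefix with the literal name as a fallback.

import os

from global_var import WORKSPACE


def getLastExperiment(name):
    # Sketch only: return the most recent experiment folder under results/
    # whose name starts with `name`, falling back to `name` itself.
    results_dir = os.path.join(WORKSPACE, 'results')
    runs = sorted(d for d in os.listdir(results_dir)
                  if os.path.isdir(os.path.join(results_dir, d)) and d.startswith(name))
    return runs[-1] if runs else name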
Example 3
            if env.isCheckpoint():
                o, s = env.getCurrentOccasion()  # query the current situation from the environment
                a = RL.chooseAction(s, o)        # let the trained agent pick an action
                env.prolongTL(a)                 # prolong the traffic light phase accordingly

        if step % VERIFY_INTERVAL == 0:
            env.calWaitingTime()  # periodically record the waiting time
        step += 1
        env.conn.simulationStep()  # advance the simulation by one step

    env.conn.close()  # close the simulation connection
    sys.stdout.flush()

    # Report the average waiting time and the number of samples
    print(round(np.mean(env.waitingtime), 2), len(env.waitingtime))
    return env.waitingtime


if __name__ == '__main__':
    from RL_brain import QLearningTable
    from global_var import green_states, WORKSPACE

    trained_path = '{}/results/{}/'.format(WORKSPACE, 'p5i3g0')
    qtable_path = trained_path + 'qtable.csv'
    RL = QLearningTable(list(range(len(green_states))))
    RL.feedQTable(qtable_path)
    RL.epsilon = 1
    fixed = testAgent('fixed', RL)
    rl = testAgent('rl', RL)
    actuated = testAgent('actuated', RL)
    plotTestResult(rl, fixed, actuated, trained_path)
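Example 3 begins in the middle of testAgent, so its signature and setup are not part of the snippet. The skeleton below is only a guess at how the fragment fits into the full function: Env, SIM_STEPS and the mode check are assumptions and do not come from the original code.

def testAgent(mode, RL):
    # Skeleton only: Env and SIM_STEPS are assumed names, not from the original code.
    env = Env(mode)        # assumed wrapper that starts the simulation under the given control mode
    step = 0
    while step < SIM_STEPS:
        if mode == 'rl':   # assumption: only the RL mode consults the agent
            if env.isCheckpoint():
                o, s = env.getCurrentOccasion()
                a = RL.chooseAction(s, o)
                env.prolongTL(a)

        if step % VERIFY_INTERVAL == 0:
            env.calWaitingTime()
        step += 1
        env.conn.simulationStep()

    env.conn.close()
    return env.waitingtime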