Exemple #1
0
 def test_offpol_sarsa(cls):
     """Run the 'offpol_sarsa' experiment and check that a DataFrame is returned."""
     result = run('offpol_sarsa')
     assert isinstance(result, pd.DataFrame)
Exemple #2
0
 def test_dqn_v1(cls):
     """Run the 'dqn_v1' experiment and check that a DataFrame is returned."""
     result = run('dqn_v1')
     assert isinstance(result, pd.DataFrame)
Exemple #3
0
 def test_quickstart_dqn(cls):
     """Run the 'quickstart_dqn' experiment and check that a DataFrame is returned."""
     result = run('quickstart_dqn')
     assert isinstance(result, pd.DataFrame)
Exemple #4
0
 def test_double_dqn(cls):
     """Run the 'double_dqn' experiment and check that a DataFrame is returned."""
     result = run('double_dqn')
     assert isinstance(result, pd.DataFrame)
Exemple #5
0
 def test_lunar_dqn(cls):
     """Run the 'lunar_dqn' experiment and check that a DataFrame is returned."""
     result = run('lunar_dqn')
     assert isinstance(result, pd.DataFrame)
Exemple #6
0
 def test_q_table(cls):
     """Run the 'q_table' experiment and check that a DataFrame is returned."""
     result = run('q_table')
     assert isinstance(result, pd.DataFrame)
 def test_dqn_epsilon(cls):
     """Run the 'dqn_epsilon' experiment and check that a DataFrame is returned."""
     result = run('dqn_epsilon')
     assert isinstance(result, pd.DataFrame)
Exemple #8
0
 def test_acrobot(cls):
     """Run the 'acrobot' experiment and check that a DataFrame is returned."""
     result = run('acrobot')
     assert isinstance(result, pd.DataFrame)
Exemple #9
0
 def test_pendulum_ddpg(cls):
     """Run the 'pendulum_ddpg' experiment and check that a DataFrame is returned."""
     result = run('pendulum_ddpg')
     assert isinstance(result, pd.DataFrame)
 def test_quickstart_dqn(cls):
     """Run the 'quickstart_dqn' experiment and check that a DataFrame is returned."""
     result = run('quickstart_dqn')
     assert isinstance(result, pd.DataFrame)
Exemple #11
0
 def test_breakout_dqn(cls):
     """Run the 'breakout_dqn' experiment and check that a DataFrame is returned."""
     result = run('breakout_dqn')
     assert isinstance(result, pd.DataFrame)
Exemple #12
0
 def test_walker_ddpg_linearnoise(cls):
     """Run the 'walker_ddpg_linearnoise' experiment and check for a DataFrame result."""
     result = run('walker_ddpg_linearnoise')
     assert isinstance(result, pd.DataFrame)
Exemple #13
0
 def test_lunar_freeze(cls):
     """Run the 'lunar_freeze' experiment and check that a DataFrame is returned."""
     result = run('lunar_freeze')
     assert isinstance(result, pd.DataFrame)
Exemple #14
0
 def test_pendulum_ddpg_linearnoise(cls):
     """Run the 'pendulum_ddpg_linearnoise' experiment and check for a DataFrame result."""
     result = run('pendulum_ddpg_linearnoise')
     assert isinstance(result, pd.DataFrame)
 def test_cartpole_ac_argmax(cls):
     """Run the 'cartpole_ac_argmax' experiment and check for a DataFrame result."""
     result = run('cartpole_ac_argmax')
     assert isinstance(result, pd.DataFrame)
Exemple #16
0
 def test_exp_sarsa(cls):
     """Run the 'exp_sarsa' experiment and check that a DataFrame is returned."""
     result = run('exp_sarsa')
     assert isinstance(result, pd.DataFrame)
 def test_dqn_v1(cls):
     """Run the 'dqn_v1' experiment and check that a DataFrame is returned."""
     result = run('dqn_v1')
     assert isinstance(result, pd.DataFrame)
Exemple #18
0
 def test_lunar_dqn(cls):
     """Run the 'lunar_dqn' experiment and check that a DataFrame is returned."""
     result = run('lunar_dqn')
     assert isinstance(result, pd.DataFrame)
 def test_pendulum_ddpg_linearnoise(cls):
     """Run the 'pendulum_ddpg_linearnoise' experiment and check for a DataFrame result."""
     result = run('pendulum_ddpg_linearnoise')
     assert isinstance(result, pd.DataFrame)
Exemple #20
0
 def test_gym_tour(cls):
     """Run the 'dummy' experiment and check that a DataFrame is returned."""
     result = run('dummy')
     assert isinstance(result, pd.DataFrame)
Exemple #21
0
 def test_run_q_table(self):
     """Run the 'q_table' experiment and check that a DataFrame is returned."""
     result = run('q_table')
     assert isinstance(result, pd.DataFrame)
Exemple #22
0
 def test_dqn_pass(cls):
     """Run the 'test_dqn_pass' experiment and require a reward mean above 50.

     Reads entry 0 of the 'max_total_rewards_stats_mean' column from the
     result of run(), prints it, and asserts that it exceeds 50.
     """
     results = run('test_dqn_pass')
     reward_mean = results['max_total_rewards_stats_mean'][0]
     print(reward_mean)
     assert reward_mean > 50, 'dqn failed to hit max_total_rewards'
Exemple #23
0
 def test_run_dqn(self):
     """Run the 'dqn' experiment and check that a DataFrame is returned."""
     result = run('dqn')
     assert isinstance(result, pd.DataFrame)
Exemple #24
0
 def test_dqn_epsilon(cls):
     """Run the 'dqn_epsilon' experiment and check that a DataFrame is returned."""
     result = run('dqn_epsilon')
     assert isinstance(result, pd.DataFrame)
Exemple #25
0
 def test_run_mountain_double_dqn(self):
     """Run the 'mountain_double_dqn' experiment and check for a DataFrame result."""
     result = run('mountain_double_dqn')
     assert isinstance(result, pd.DataFrame)
Exemple #26
0
 def test_exp_sarsa(cls):
     """Run the 'exp_sarsa' experiment and check that a DataFrame is returned."""
     result = run('exp_sarsa')
     assert isinstance(result, pd.DataFrame)
Exemple #27
0
 def test_run_gym_tour(self):
     """Run the 'dummy' experiment and check that a DataFrame is returned."""
     result = run('dummy')
     assert isinstance(result, pd.DataFrame)
Exemple #28
0
 def test_cartpole_ac_argmax(cls):
     """Run the 'cartpole_ac_argmax' experiment and check for a DataFrame result."""
     result = run('cartpole_ac_argmax')
     assert isinstance(result, pd.DataFrame)
Exemple #29
0
from rl.experiment import run

if __name__ == '__main__':
    # Script entry point: launch one experiment through run().
    # Only the 'lunar_dqn' call is active; the commented-out calls are
    # alternative invocations kept for reference.
    # run('dev_dqn', times=2, param_selection=True)
    # run('dqn', times=2, param_selection=False)
    run('lunar_dqn', times=5, param_selection=True)
    # run('DevCartPole-v0_DQN_HighLowMemoryWithForgetting_BoltzmannPolicy_NoPreProcessor_2017-01-21_191023_e0', plot_only=True)
    # run('lunar_dqn', times=3, param_selection=True, line_search=True)
    # run('breakout_dqn', times=1, param_selection=True)
Exemple #30
0
 def test_acrobot(cls):
     """Run the 'acrobot' experiment and check that a DataFrame is returned."""
     result = run('acrobot')
     assert isinstance(result, pd.DataFrame)
Exemple #31
0
 def test_dqn(cls):
     """Run the 'double_dqn_per' experiment and check that a DataFrame is returned.

     Note that the experiment name passed to run() differs from the test name.
     """
     result = run('double_dqn_per')
     assert isinstance(result, pd.DataFrame)
Exemple #32
0
 def test_mountain_dqn(cls):
     """Run the 'mountain_dqn' experiment and check that a DataFrame is returned."""
     result = run('mountain_dqn')
     assert isinstance(result, pd.DataFrame)
Exemple #33
0
 def test_gym_tour(cls):
     """Run the 'dummy' experiment and check that a DataFrame is returned."""
     result = run('dummy')
     assert isinstance(result, pd.DataFrame)
Exemple #34
0
 def test_offpol_sarsa(cls):
     """Run the 'offpol_sarsa' experiment and check that a DataFrame is returned."""
     result = run('offpol_sarsa')
     assert isinstance(result, pd.DataFrame)
Exemple #35
0
 def test_q_table(cls):
     """Run the 'q_table' experiment and check that a DataFrame is returned."""
     result = run('q_table')
     assert isinstance(result, pd.DataFrame)
Exemple #36
0
 def test_mountain_dqn(cls):
     """Run the 'mountain_dqn' experiment and check that a DataFrame is returned."""
     result = run('mountain_dqn')
     assert isinstance(result, pd.DataFrame)
Exemple #37
0
 def test_dqn_pass(cls):
     """Run the 'test_dqn_pass' experiment and require a reward mean above 50.

     Reads entry 0 of the 'max_total_rewards_stats_mean' column from the
     result of run(), prints it, and asserts that it exceeds 50.
     """
     results = run('test_dqn_pass')
     reward_mean = results['max_total_rewards_stats_mean'][0]
     print(reward_mean)
     assert reward_mean > 50, 'dqn failed to hit max_total_rewards'
Exemple #38
0
 def test_breakout_double_dqn(cls):
     """Run the 'breakout_double_dqn' experiment and check for a DataFrame result."""
     result = run('breakout_double_dqn')
     assert isinstance(result, pd.DataFrame)
Exemple #39
0
from rl.experiment import run
from rl.util import args

if __name__ == '__main__':
    # Script entry point: run the experiment named by args.experiment,
    # forwarding the attributes of args as keyword arguments.
    # NOTE(review): vars(args) presumably also contains 'experiment'; confirm
    # run() accepts it as a keyword alongside the positional value.
    run(args.experiment, **vars(args))