Esempio n. 1
0
 def test_offpol_sarsa(cls):
     """Call run('offpol_sarsa') and require a pd.DataFrame back."""
     assert isinstance(run('offpol_sarsa'), pd.DataFrame)
Esempio n. 2
0
 def test_dqn_v1(cls):
     """Smoke test: run('dqn_v1') must hand back a pd.DataFrame."""
     outcome = run('dqn_v1')
     expected_type = pd.DataFrame
     assert isinstance(outcome, expected_type)
Esempio n. 3
0
 def test_quickstart_dqn(cls):
     """Check that run('quickstart_dqn') returns a pd.DataFrame instance."""
     result = run('quickstart_dqn')
     # Only the type of the returned object is verified, not its contents.
     assert isinstance(result, pd.DataFrame)
Esempio n. 4
0
 def test_double_dqn(cls):
     """Call run('double_dqn') and assert the result is a pd.DataFrame."""
     assert isinstance(run('double_dqn'), pd.DataFrame)
Esempio n. 5
0
 def test_lunar_dqn(cls):
     """Smoke test: the value returned by run('lunar_dqn') is a pd.DataFrame."""
     frame = run('lunar_dqn')
     assert isinstance(frame, pd.DataFrame)
Esempio n. 6
0
 def test_q_table(cls):
     """Run 'q_table' through run() and verify a pd.DataFrame comes back."""
     returned = run('q_table')
     is_frame = isinstance(returned, pd.DataFrame)
     assert is_frame
Esempio n. 7
0
 def test_dqn_epsilon(cls):
     """Call run('dqn_epsilon') and require a pd.DataFrame result."""
     assert isinstance(run('dqn_epsilon'), pd.DataFrame)
Esempio n. 8
0
 def test_acrobot(cls):
     """Smoke test: run('acrobot') must return a pd.DataFrame."""
     output = run('acrobot')
     # Type check only; the frame's contents are not inspected here.
     assert isinstance(output, pd.DataFrame)
Esempio n. 9
0
 def test_pendulum_ddpg(cls):
     """Check that run('pendulum_ddpg') yields a pd.DataFrame."""
     result_df = run('pendulum_ddpg')
     assert isinstance(result_df, pd.DataFrame)
Esempio n. 10
0
 def test_quickstart_dqn(cls):
     """Call run('quickstart_dqn') and assert its result is a pd.DataFrame."""
     assert isinstance(run('quickstart_dqn'), pd.DataFrame)
Esempio n. 11
0
 def test_breakout_dqn(cls):
     """Smoke test: run('breakout_dqn') must hand back a pd.DataFrame."""
     outcome = run('breakout_dqn')
     assert isinstance(outcome, pd.DataFrame)
Esempio n. 12
0
 def test_walker_ddpg_linearnoise(cls):
     """Run 'walker_ddpg_linearnoise' via run() and verify the return type.

     Passes when the returned object is an instance of pd.DataFrame.
     """
     returned = run('walker_ddpg_linearnoise')
     assert isinstance(returned, pd.DataFrame)
Esempio n. 13
0
 def test_lunar_freeze(cls):
     """Call run('lunar_freeze') and require a pd.DataFrame back."""
     assert isinstance(run('lunar_freeze'), pd.DataFrame)
Esempio n. 14
0
 def test_pendulum_ddpg_linearnoise(cls):
     """Smoke test: run('pendulum_ddpg_linearnoise') returns a pd.DataFrame."""
     frame = run('pendulum_ddpg_linearnoise')
     expected_type = pd.DataFrame
     assert isinstance(frame, expected_type)
Esempio n. 15
0
 def test_cartpole_ac_argmax(cls):
     """Check that run('cartpole_ac_argmax') produces a pd.DataFrame."""
     result = run('cartpole_ac_argmax')
     assert isinstance(result, pd.DataFrame)
Esempio n. 16
0
 def test_exp_sarsa(cls):
     """Call run('exp_sarsa') and assert the result is a pd.DataFrame."""
     assert isinstance(run('exp_sarsa'), pd.DataFrame)
Esempio n. 17
0
 def test_dqn_v1(cls):
     """Run 'dqn_v1' through run() and verify a pd.DataFrame is returned."""
     output = run('dqn_v1')
     # Only the return type is asserted.
     assert isinstance(output, pd.DataFrame)
Esempio n. 18
0
 def test_lunar_dqn(cls):
     """Call run('lunar_dqn') and require a pd.DataFrame result."""
     assert isinstance(run('lunar_dqn'), pd.DataFrame)
Esempio n. 19
0
 def test_pendulum_ddpg_linearnoise(cls):
     """Check the return type of run('pendulum_ddpg_linearnoise').

     The test passes when run() gives back a pd.DataFrame instance.
     """
     result_df = run('pendulum_ddpg_linearnoise')
     assert isinstance(result_df, pd.DataFrame)
Esempio n. 20
0
 def test_gym_tour(cls):
     """Call run('dummy') and assert that a pd.DataFrame is returned."""
     # NOTE(review): the method is named "gym_tour" but the identifier passed
     # to run() is 'dummy' -- confirm this pairing is intentional.
     outcome = run('dummy')
     assert isinstance(outcome, pd.DataFrame)
Esempio n. 21
0
 def test_run_q_table(self):
     """Smoke test: run('q_table') must return a pd.DataFrame."""
     assert isinstance(run('q_table'), pd.DataFrame)
Esempio n. 22
0
 def test_dqn_pass(cls):
     """Run 'test_dqn_pass' and require its reward statistic to exceed 50.

     Reads entry 0 of the 'max_total_rewards_stats_mean' column from the
     object returned by run(), prints it, and asserts it is greater than 50.
     """
     reward_floor = 50
     results = run('test_dqn_pass')
     reward_column = results['max_total_rewards_stats_mean']
     best_reward_mean = reward_column[0]
     # Echo the value so it is visible in the test output.
     print(best_reward_mean)
     assert best_reward_mean > reward_floor, 'dqn failed to hit max_total_rewards'
Esempio n. 23
0
 def test_run_dqn(self):
     """Call run('dqn') and verify the returned object is a pd.DataFrame."""
     returned = run('dqn')
     assert isinstance(returned, pd.DataFrame)
Esempio n. 24
0
 def test_dqn_epsilon(cls):
     """Smoke test: run('dqn_epsilon') must hand back a pd.DataFrame."""
     frame = run('dqn_epsilon')
     is_frame = isinstance(frame, pd.DataFrame)
     assert is_frame
Esempio n. 25
0
 def test_run_mountain_double_dqn(self):
     """Call run('mountain_double_dqn') and require a pd.DataFrame back."""
     assert isinstance(run('mountain_double_dqn'), pd.DataFrame)
Esempio n. 26
0
 def test_exp_sarsa(cls):
     """Check that run('exp_sarsa') returns a pd.DataFrame instance."""
     result = run('exp_sarsa')
     # Type check only; the contents are not examined.
     assert isinstance(result, pd.DataFrame)
Esempio n. 27
0
 def test_run_gym_tour(self):
     """Call run('dummy') and assert the result is a pd.DataFrame."""
     # NOTE(review): method name mentions "gym_tour" while run() receives
     # 'dummy' -- confirm this is the intended identifier.
     assert isinstance(run('dummy'), pd.DataFrame)
Esempio n. 28
0
 def test_cartpole_ac_argmax(cls):
     """Call run('cartpole_ac_argmax') and require a pd.DataFrame result."""
     assert isinstance(run('cartpole_ac_argmax'), pd.DataFrame)
Esempio n. 29
0
from rl.experiment import run

if __name__ == '__main__':
    # Script entry point: invokes run() once for 'lunar_dqn' with times=5 and
    # param_selection=True.
    #
    # Alternative invocations, left disabled for reference:
    # run('dev_dqn', times=2, param_selection=True)
    # run('dqn', times=2, param_selection=False)
    # run('DevCartPole-v0_DQN_HighLowMemoryWithForgetting_BoltzmannPolicy_NoPreProcessor_2017-01-21_191023_e0', plot_only=True)
    # run('lunar_dqn', times=3, param_selection=True, line_search=True)
    # run('breakout_dqn', times=1, param_selection=True)
    run_options = {'times': 5, 'param_selection': True}
    run('lunar_dqn', **run_options)
Esempio n. 30
0
 def test_acrobot(cls):
     """Call run('acrobot') and assert the result is a pd.DataFrame."""
     assert isinstance(run('acrobot'), pd.DataFrame)
Esempio n. 31
0
 def test_dqn(cls):
     """Call run('double_dqn_per') and verify a pd.DataFrame is returned."""
     # NOTE(review): the method is named "test_dqn" but it runs
     # 'double_dqn_per' -- confirm the name/identifier pairing is intended.
     outcome = run('double_dqn_per')
     assert isinstance(outcome, pd.DataFrame)
Esempio n. 32
0
 def test_mountain_dqn(cls):
     """Smoke test: run('mountain_dqn') must return a pd.DataFrame."""
     returned = run('mountain_dqn')
     expected_type = pd.DataFrame
     assert isinstance(returned, expected_type)
Esempio n. 33
0
 def test_gym_tour(cls):
     """Check that run('dummy') gives back a pd.DataFrame instance."""
     # NOTE(review): 'dummy' is the identifier used for the "gym_tour" test;
     # verify that this is deliberate.
     assert isinstance(run('dummy'), pd.DataFrame)
Esempio n. 34
0
 def test_offpol_sarsa(cls):
     """Run 'offpol_sarsa' through run() and verify the return type.

     Passes when the returned object is an instance of pd.DataFrame.
     """
     frame = run('offpol_sarsa')
     assert isinstance(frame, pd.DataFrame)
Esempio n. 35
0
 def test_q_table(cls):
     """Call run('q_table') and require a pd.DataFrame back."""
     assert isinstance(run('q_table'), pd.DataFrame)
Esempio n. 36
0
 def test_mountain_dqn(cls):
     """Call run('mountain_dqn') and assert its result is a pd.DataFrame."""
     result_df = run('mountain_dqn')
     # Only the type of the result is checked.
     assert isinstance(result_df, pd.DataFrame)
Esempio n. 37
0
 def test_dqn_pass(cls):
     """Assert that run('test_dqn_pass') reports a reward statistic above 50.

     Takes entry 0 of the 'max_total_rewards_stats_mean' column of the
     returned object, prints it, then asserts that it is greater than 50.
     """
     outcome = run('test_dqn_pass')
     observed = outcome['max_total_rewards_stats_mean'][0]
     print(observed)
     minimum_exclusive = 50
     assert observed > minimum_exclusive, 'dqn failed to hit max_total_rewards'
Esempio n. 38
0
 def test_breakout_double_dqn(cls):
     """Smoke test: run('breakout_double_dqn') must return a pd.DataFrame."""
     assert isinstance(run('breakout_double_dqn'), pd.DataFrame)
Esempio n. 39
0
from rl.experiment import run
from rl.util import args

if __name__ == '__main__':
    # Script entry point: forward every attribute of `args` to run() as
    # keyword arguments, with args.experiment also passed positionally.
    # NOTE(review): vars(args) presumably contains an 'experiment' key too;
    # confirm run() accepts that keyword alongside its first positional.
    experiment_name = args.experiment
    cli_options = vars(args)
    run(experiment_name, **cli_options)