示例#1
0
 def test_offpol_sarsa(cls):
     """Check that run('offpol_sarsa') returns a pandas DataFrame."""
     result = run('offpol_sarsa')
     assert isinstance(result, pd.DataFrame)
示例#2
0
 def test_dqn_v1(cls):
     """Check that run('dqn_v1') returns a pandas DataFrame."""
     result = run('dqn_v1')
     assert isinstance(result, pd.DataFrame)
示例#3
0
 def test_quickstart_dqn(cls):
     """Check that run('quickstart_dqn') returns a pandas DataFrame."""
     result = run('quickstart_dqn')
     assert isinstance(result, pd.DataFrame)
示例#4
0
 def test_double_dqn(cls):
     """Check that run('double_dqn') returns a pandas DataFrame."""
     result = run('double_dqn')
     assert isinstance(result, pd.DataFrame)
示例#5
0
 def test_lunar_dqn(cls):
     """Check that run('lunar_dqn') returns a pandas DataFrame."""
     result = run('lunar_dqn')
     assert isinstance(result, pd.DataFrame)
示例#6
0
 def test_q_table(cls):
     """Check that run('q_table') returns a pandas DataFrame."""
     result = run('q_table')
     assert isinstance(result, pd.DataFrame)
示例#7
0
 def test_dqn_epsilon(cls):
     """Check that run('dqn_epsilon') returns a pandas DataFrame."""
     result = run('dqn_epsilon')
     assert isinstance(result, pd.DataFrame)
示例#8
0
 def test_acrobot(cls):
     """Check that run('acrobot') returns a pandas DataFrame."""
     result = run('acrobot')
     assert isinstance(result, pd.DataFrame)
示例#9
0
 def test_pendulum_ddpg(cls):
     """Check that run('pendulum_ddpg') returns a pandas DataFrame."""
     result = run('pendulum_ddpg')
     assert isinstance(result, pd.DataFrame)
示例#10
0
 def test_quickstart_dqn(cls):
     """Check that run('quickstart_dqn') returns a pandas DataFrame."""
     result = run('quickstart_dqn')
     assert isinstance(result, pd.DataFrame)
示例#11
0
 def test_breakout_dqn(cls):
     """Check that run('breakout_dqn') returns a pandas DataFrame."""
     result = run('breakout_dqn')
     assert isinstance(result, pd.DataFrame)
示例#12
0
 def test_walker_ddpg_linearnoise(cls):
     """Check that run('walker_ddpg_linearnoise') returns a pandas DataFrame."""
     result = run('walker_ddpg_linearnoise')
     assert isinstance(result, pd.DataFrame)
示例#13
0
 def test_lunar_freeze(cls):
     """Check that run('lunar_freeze') returns a pandas DataFrame."""
     result = run('lunar_freeze')
     assert isinstance(result, pd.DataFrame)
示例#14
0
 def test_pendulum_ddpg_linearnoise(cls):
     """Check that run('pendulum_ddpg_linearnoise') returns a pandas DataFrame."""
     result = run('pendulum_ddpg_linearnoise')
     assert isinstance(result, pd.DataFrame)
示例#15
0
 def test_cartpole_ac_argmax(cls):
     """Check that run('cartpole_ac_argmax') returns a pandas DataFrame."""
     result = run('cartpole_ac_argmax')
     assert isinstance(result, pd.DataFrame)
示例#16
0
 def test_exp_sarsa(cls):
     """Check that run('exp_sarsa') returns a pandas DataFrame."""
     result = run('exp_sarsa')
     assert isinstance(result, pd.DataFrame)
示例#17
0
 def test_dqn_v1(cls):
     """Check that run('dqn_v1') returns a pandas DataFrame."""
     result = run('dqn_v1')
     assert isinstance(result, pd.DataFrame)
示例#18
0
 def test_lunar_dqn(cls):
     """Check that run('lunar_dqn') returns a pandas DataFrame."""
     result = run('lunar_dqn')
     assert isinstance(result, pd.DataFrame)
示例#19
0
 def test_pendulum_ddpg_linearnoise(cls):
     """Check that run('pendulum_ddpg_linearnoise') returns a pandas DataFrame."""
     result = run('pendulum_ddpg_linearnoise')
     assert isinstance(result, pd.DataFrame)
示例#20
0
 def test_gym_tour(cls):
     """Check that run('dummy') returns a pandas DataFrame."""
     result = run('dummy')
     assert isinstance(result, pd.DataFrame)
示例#21
0
 def test_run_q_table(self):
     """Check that run('q_table') returns a pandas DataFrame."""
     result = run('q_table')
     assert isinstance(result, pd.DataFrame)
示例#22
0
 def test_dqn_pass(cls):
     """Call run('test_dqn_pass') and require its reward statistic to exceed 50.

     Reads the entry at key 0 of the 'max_total_rewards_stats_mean' column,
     prints it, and asserts that it is greater than 50.
     """
     results = run('test_dqn_pass')
     reward_means = results['max_total_rewards_stats_mean']
     # NOTE(review): [0] is a key lookup on the column, not necessarily the
     # first row -- confirm the returned frame's index makes these the same.
     top_reward = reward_means[0]
     print(top_reward)
     assert top_reward > 50, 'dqn failed to hit max_total_rewards'
示例#23
0
 def test_run_dqn(self):
     """Check that run('dqn') returns a pandas DataFrame."""
     result = run('dqn')
     assert isinstance(result, pd.DataFrame)
示例#24
0
 def test_dqn_epsilon(cls):
     """Check that run('dqn_epsilon') returns a pandas DataFrame."""
     result = run('dqn_epsilon')
     assert isinstance(result, pd.DataFrame)
示例#25
0
 def test_run_mountain_double_dqn(self):
     """Check that run('mountain_double_dqn') returns a pandas DataFrame."""
     result = run('mountain_double_dqn')
     assert isinstance(result, pd.DataFrame)
示例#26
0
 def test_exp_sarsa(cls):
     """Check that run('exp_sarsa') returns a pandas DataFrame."""
     result = run('exp_sarsa')
     assert isinstance(result, pd.DataFrame)
示例#27
0
 def test_run_gym_tour(self):
     """Check that run('dummy') returns a pandas DataFrame."""
     result = run('dummy')
     assert isinstance(result, pd.DataFrame)
示例#28
0
 def test_cartpole_ac_argmax(cls):
     """Check that run('cartpole_ac_argmax') returns a pandas DataFrame."""
     result = run('cartpole_ac_argmax')
     assert isinstance(result, pd.DataFrame)
示例#29
0
from rl.experiment import run

if __name__ == '__main__':
    # Script entry point: launches the 'lunar_dqn' experiment with
    # times=5 and param_selection=True.
    #
    # Other invocations kept for quick switching while developing:
    #   run('dev_dqn', times=2, param_selection=True)
    #   run('dqn', times=2, param_selection=False)
    #   run('DevCartPole-v0_DQN_HighLowMemoryWithForgetting_BoltzmannPolicy_NoPreProcessor_2017-01-21_191023_e0', plot_only=True)
    #   run('lunar_dqn', times=3, param_selection=True, line_search=True)
    #   run('breakout_dqn', times=1, param_selection=True)
    run_options = {'times': 5, 'param_selection': True}
    run('lunar_dqn', **run_options)
示例#30
0
 def test_acrobot(cls):
     """Check that run('acrobot') returns a pandas DataFrame."""
     result = run('acrobot')
     assert isinstance(result, pd.DataFrame)
示例#31
0
 def test_dqn(cls):
     """Check that run('double_dqn_per') returns a pandas DataFrame."""
     result = run('double_dqn_per')
     assert isinstance(result, pd.DataFrame)
示例#32
0
 def test_mountain_dqn(cls):
     """Check that run('mountain_dqn') returns a pandas DataFrame."""
     result = run('mountain_dqn')
     assert isinstance(result, pd.DataFrame)
示例#33
0
 def test_gym_tour(cls):
     """Check that run('dummy') returns a pandas DataFrame."""
     result = run('dummy')
     assert isinstance(result, pd.DataFrame)
示例#34
0
 def test_offpol_sarsa(cls):
     """Check that run('offpol_sarsa') returns a pandas DataFrame."""
     result = run('offpol_sarsa')
     assert isinstance(result, pd.DataFrame)
示例#35
0
 def test_q_table(cls):
     """Check that run('q_table') returns a pandas DataFrame."""
     result = run('q_table')
     assert isinstance(result, pd.DataFrame)
示例#36
0
 def test_mountain_dqn(cls):
     """Check that run('mountain_dqn') returns a pandas DataFrame."""
     result = run('mountain_dqn')
     assert isinstance(result, pd.DataFrame)
示例#37
0
 def test_dqn_pass(cls):
     """Call run('test_dqn_pass') and require its reward statistic to exceed 50.

     Reads the entry at key 0 of the 'max_total_rewards_stats_mean' column,
     prints it, and asserts that it is greater than 50.
     """
     results = run('test_dqn_pass')
     reward_means = results['max_total_rewards_stats_mean']
     # NOTE(review): [0] is a key lookup on the column, not necessarily the
     # first row -- confirm the returned frame's index makes these the same.
     top_reward = reward_means[0]
     print(top_reward)
     assert top_reward > 50, 'dqn failed to hit max_total_rewards'
示例#38
0
 def test_breakout_double_dqn(cls):
     """Check that run('breakout_double_dqn') returns a pandas DataFrame."""
     result = run('breakout_double_dqn')
     assert isinstance(result, pd.DataFrame)
示例#39
0
from rl.experiment import run
from rl.util import args

if __name__ == '__main__':
    # Script entry point: the experiment name is passed positionally and
    # every attribute of `args` is forwarded to run() as a keyword argument.
    experiment_name = args.experiment
    cli_options = vars(args)
    run(experiment_name, **cli_options)