def test_dqn(
    observation_shape,
    action_size,
    n_critics,
    q_func_factory,
    scaler,
    target_reduction_type,
):
    """Construct a DQN from the given options and run the shared algo checks.

    The instance is passed first to ``algo_tester`` together with
    ``observation_shape``, then to ``algo_update_tester`` together with
    ``observation_shape`` and ``action_size`` using ``discrete=True``.
    """
    # NOTE(review): a second ``test_dqn`` with a different signature is
    # visible in this source; if both live in the same module the later
    # definition shadows the earlier one -- confirm which is intended.
    algo = DQN(
        n_critics=n_critics,
        q_func_factory=q_func_factory,
        scaler=scaler,
        target_reduction_type=target_reduction_type,
    )

    algo_tester(algo, observation_shape)
    algo_update_tester(
        algo,
        observation_shape,
        action_size,
        discrete=True,
    )
def test_dqn_performance(q_func_type):
    """Run ``algo_cartpole_tester`` on a DQN built with ``n_epochs=1``.

    ``q_func_type`` is forwarded unchanged to the ``DQN`` constructor.
    """
    # NOTE(review): another ``test_dqn_performance`` (taking
    # ``q_func_factory``) is visible in this source; if both share a module
    # the later definition shadows the earlier one -- confirm.
    algo_cartpole_tester(DQN(n_epochs=1, q_func_type=q_func_type))
def test_dqn(observation_shape, action_size, q_func_type, scaler):
    """Construct a DQN from ``q_func_type`` and ``scaler`` and run the checks.

    The instance is passed first to ``algo_tester`` together with
    ``observation_shape``, then to ``algo_update_tester`` together with
    ``observation_shape`` and ``action_size`` using ``discrete=True``.
    """
    # NOTE(review): another ``test_dqn`` with a different signature is
    # visible in this source; if both live in the same module the later
    # definition shadows the earlier one -- confirm which is intended.
    agent = DQN(q_func_type=q_func_type, scaler=scaler)

    algo_tester(agent, observation_shape)
    algo_update_tester(
        agent,
        observation_shape,
        action_size,
        discrete=True,
    )
def test_dqn_performance(q_func_factory):
    """Run ``algo_cartpole_tester`` on a DQN built from ``q_func_factory``.

    ``q_func_factory`` is forwarded unchanged to the ``DQN`` constructor; no
    other constructor arguments are supplied.
    """
    # NOTE(review): another ``test_dqn_performance`` (taking ``q_func_type``)
    # is visible in this source; if both share a module the later definition
    # shadows the earlier one -- confirm.
    algo_cartpole_tester(DQN(q_func_factory=q_func_factory))