def test_discrete_cql(
    observation_shape,
    action_size,
    n_critics,
    q_func_factory,
    scaler,
    target_reduction_type,
):
    """Build a ``DiscreteCQL`` and run the shared algorithm checks on it.

    The algorithm is constructed from ``n_critics``, ``q_func_factory``,
    ``scaler`` and ``target_reduction_type``, then handed to
    ``algo_tester`` and ``algo_update_tester``.

    Arguments are presumably supplied by pytest parametrization or
    fixtures that are not visible in this part of the file -- confirm.
    """
    # NOTE(review): another ``test_discrete_cql`` is defined later in this
    # file; the later definition rebinds the name, so this variant may never
    # be collected. Confirm which version is intended to run.
    hyperparams = {
        "n_critics": n_critics,
        "q_func_factory": q_func_factory,
        "scaler": scaler,
        "target_reduction_type": target_reduction_type,
    }
    algo = DiscreteCQL(**hyperparams)

    algo_tester(algo, observation_shape)
    # The trailing ``True`` is passed positionally; its meaning is defined by
    # ``algo_update_tester`` (presumably a discrete-action flag -- confirm).
    algo_update_tester(algo, observation_shape, action_size, True)
def test_discrete_cql_performance(q_func_factory):
    """Run the cartpole check on a ``DiscreteCQL`` built with ``q_func_factory``.

    ``q_func_factory`` is forwarded as a keyword argument to the
    ``DiscreteCQL`` constructor; every other setting is left at the
    constructor's default.
    """
    # NOTE(review): another ``test_discrete_cql_performance`` is defined later
    # in this file; the later definition rebinds the name, so this variant may
    # never be collected. Confirm which version is intended to run.
    algo = DiscreteCQL(q_func_factory=q_func_factory)
    algo_cartpole_tester(algo)
def test_discrete_cql(observation_shape, action_size, q_func_factory, scaler):
    """Build a ``DiscreteCQL`` and run the shared algorithm checks on it.

    The algorithm is constructed from ``q_func_factory`` and ``scaler``
    only, then handed to ``algo_tester`` and ``algo_update_tester``.

    Arguments are presumably supplied by pytest parametrization or
    fixtures that are not visible in this part of the file -- confirm.
    """
    # NOTE(review): an earlier ``test_discrete_cql`` with a wider signature
    # appears above in this file; this definition rebinds that name. Confirm
    # which version is intended to run.
    hyperparams = {
        "q_func_factory": q_func_factory,
        "scaler": scaler,
    }
    algo = DiscreteCQL(**hyperparams)

    algo_tester(algo, observation_shape)
    # The trailing ``True`` is passed positionally; its meaning is defined by
    # ``algo_update_tester`` (presumably a discrete-action flag -- confirm).
    algo_update_tester(algo, observation_shape, action_size, True)
def test_discrete_cql_performance(q_func_type):
    """Run the cartpole check on a one-epoch ``DiscreteCQL``.

    The algorithm is built with ``n_epochs=1`` and the given
    ``q_func_type``, then passed to ``algo_cartpole_tester``.
    """
    # NOTE(review): an earlier ``test_discrete_cql_performance`` taking
    # ``q_func_factory`` appears above in this file; this definition rebinds
    # that name. Confirm which version is intended to run.
    hyperparams = {
        "n_epochs": 1,
        "q_func_type": q_func_type,
    }
    algo = DiscreteCQL(**hyperparams)
    algo_cartpole_tester(algo)