예제 #1
0
def test_discrete_cql(
    observation_shape,
    action_size,
    n_critics,
    q_func_factory,
    scaler,
    target_reduction_type,
):
    """Build a ``DiscreteCQL`` from the given options and run the shared checks.

    ``n_critics``, ``q_func_factory``, ``scaler`` and
    ``target_reduction_type`` are forwarded unchanged as keyword arguments
    to the ``DiscreteCQL`` constructor.  The resulting object is then handed
    to ``algo_tester`` and ``algo_update_tester``.
    """
    constructor_kwargs = {
        "n_critics": n_critics,
        "q_func_factory": q_func_factory,
        "scaler": scaler,
        "target_reduction_type": target_reduction_type,
    }
    algo = DiscreteCQL(**constructor_kwargs)

    algo_tester(algo, observation_shape)
    # NOTE(review): the trailing True presumably flags a discrete action
    # space -- confirm against the algo_update_tester signature.
    algo_update_tester(algo, observation_shape, action_size, True)
예제 #2
0
def test_discrete_cql_performance(q_func_factory):
    """Run ``algo_cartpole_tester`` on a ``DiscreteCQL`` using ``q_func_factory``.

    Only ``q_func_factory`` is passed to the constructor; every other
    option is left at whatever ``DiscreteCQL`` defaults to.
    """
    algo_cartpole_tester(DiscreteCQL(q_func_factory=q_func_factory))
예제 #3
0
def test_discrete_cql(observation_shape, action_size, q_func_factory, scaler):
    """Build a ``DiscreteCQL`` and run the shared algorithm checks on it.

    ``q_func_factory`` and ``scaler`` are forwarded as keyword arguments to
    the constructor; the instance is then passed to ``algo_tester`` and
    ``algo_update_tester``.
    """
    algo = DiscreteCQL(
        q_func_factory=q_func_factory,
        scaler=scaler,
    )

    algo_tester(algo, observation_shape)
    # NOTE(review): the trailing True presumably flags a discrete action
    # space -- confirm against the algo_update_tester signature.
    algo_update_tester(algo, observation_shape, action_size, True)
예제 #4
0
def test_discrete_cql_performance(q_func_type):
    """Run ``algo_cartpole_tester`` on a ``DiscreteCQL`` using ``q_func_type``.

    The algorithm is constructed with ``n_epochs=1`` and the supplied
    ``q_func_type``; no other constructor options are set.
    """
    constructor_kwargs = {"n_epochs": 1, "q_func_type": q_func_type}
    algo = DiscreteCQL(**constructor_kwargs)
    algo_cartpole_tester(algo)