コード例 #1
0
def build_q_model_and_distribution(
    policy: Policy,
    obs_space: gym.spaces.Space,
    action_space: gym.spaces.Space,
    config: TrainerConfigDict,
) -> Tuple[ModelV2, TorchDistributionWrapper]:
    """Build the Q model and pair it with the action distribution to use.

    Delegates model construction to ``build_q_models``, forwarding all four
    arguments unchanged, and returns the result together with
    ``TorchCategorical``.

    Args:
        policy: Policy the model is built for (passed through as-is).
        obs_space: Observation space (passed through as-is).
        action_space: Action space (passed through as-is).
        config: Trainer configuration (passed through as-is).

    Returns:
        A 2-tuple ``(model, TorchCategorical)``. The second element is the
        ``TorchCategorical`` object itself, not the result of calling it.
        NOTE(review): presumably this is the distribution class rather than
        an instance -- confirm against callers.
    """
    q_model = build_q_models(policy, obs_space, action_space, config)
    return q_model, TorchCategorical
コード例 #2
0
def build_q_model_and_distribution(policy, obs_space, action_space, config):
    """Return ``(model, TorchCategorical)`` for the given policy setup.

    The model comes from ``build_q_models``, which receives ``policy``,
    ``obs_space``, ``action_space`` and ``config`` unchanged. The second
    tuple element is ``TorchCategorical`` itself; it is not called here.
    """
    model = build_q_models(policy, obs_space, action_space, config)
    return model, TorchCategorical