def build_sac_model_and_action_dist(
        policy: Policy,
        obs_space: gym.spaces.Space,
        action_space: gym.spaces.Space,
        config: TrainerConfigDict
) -> Tuple[ModelV2, Type[TorchDistributionWrapper]]:
    """Builds the SAC model and selects the matching action dist class.

    Thin wrapper that delegates model construction to `build_sac_model`
    and distribution selection to `_get_dist_class`, returning both results
    together.

    Args:
        policy (Policy): The Policy that will use the model.
        obs_space (gym.spaces.Space): The observation space.
        action_space (gym.spaces.Space): The action space.
        config (TrainerConfigDict): The SAC trainer's config dict.

    Returns:
        Tuple[ModelV2, Type[TorchDistributionWrapper]]: The model returned
            by `build_sac_model` and the action distribution class returned
            by `_get_dist_class`, in that order.

    Note:
        Nothing in this function touches `policy.target_model` directly.
        Presumably `build_sac_model` creates an additional target model and
        assigns it to `policy.target_model` as a side effect -- confirm
        against that helper.
    """
    # The model is built first; any side effects on `policy` happen inside
    # `build_sac_model` before the distribution class is resolved.
    sac_model = build_sac_model(policy, obs_space, action_space, config)
    dist_cls = _get_dist_class(config, action_space)
    return sac_model, dist_cls
def build_sac_model_and_action_dist(policy, obs_space, action_space, config):
    """Builds the SAC model and selects the matching action dist class.

    Args:
        policy: The policy object, forwarded to `build_sac_model`.
        obs_space: The observation space, forwarded to `build_sac_model`.
        action_space: The action space, forwarded to both helpers.
        config: The config object, forwarded to both helpers.

    Returns:
        A 2-tuple `(model, action_dist_class)`: the result of
        `build_sac_model` followed by the result of `get_dist_class`.
    """
    # NOTE(review): this file also holds an annotated definition of the same
    # name that calls `_get_dist_class` instead of `get_dist_class` --
    # confirm which helper is actually in scope and which definition is
    # meant to win.
    # Tuple elements evaluate left to right, so the model is still built
    # before the distribution class is looked up.
    return (
        build_sac_model(policy, obs_space, action_space, config),
        get_dist_class(config, action_space),
    )