def select_actions(
    self, observations: Dict[str, types.NestedArray]
) -> Dict[str, types.NestedArray]:
    """Build one spec-generated action for every agent in `observations`.

    Args:
        observations: mapping keyed by agent name. Only the keys are
            consulted; the observation values are never read.

    Returns:
        A dict with the same keys as `observations`, each mapped to the
        result of `_generate_from_spec` applied to `self._spec[agent].actions`.
    """
    # Only the agent names matter here, so iterate the keys rather than
    # unpacking items() into a value that is never used.
    return {
        agent: _generate_from_spec(self._spec[agent].actions)
        for agent in observations
    }
def select_action(
    self, agent: str, observation: types.NestedArray
) -> Union[float, int]:
    """Produce an action for `agent` from that agent's action spec.

    Args:
        agent: key used to look up the agent's entry in `self._spec`.
        observation: accepted but not read by this method.

    Returns:
        Whatever `_generate_from_spec` yields for `self._spec[agent].actions`.
    """
    action_spec = self._spec[agent].actions
    return _generate_from_spec(action_spec)
def _generate_fake_discount(self) -> types.NestedArray:
    """Generate a discount from the currently selected agent's spec.

    Returns:
        The result of `_generate_from_spec` applied to the `discounts`
        entry of `self._specs[self.agent_selection]`.
    """
    selected_spec = self._specs[self.agent_selection]
    discount_spec = selected_spec.discounts
    return _generate_from_spec(discount_spec)
def _generate_fake_observation(self) -> Observation:
    """Generate an observation from this object's observation spec.

    Returns:
        The result of `_generate_from_spec` applied to
        `self.observation_spec()`.
    """
    obs_spec = self.observation_spec()
    return _generate_from_spec(obs_spec)
def _generate_fake_reward(self) -> types.NestedArray:
    """Generate a reward from the currently selected agent's spec.

    Returns:
        The result of `_generate_from_spec` applied to the `rewards`
        entry of `self._specs[self.agent_selection]`.
    """
    selected_spec = self._specs[self.agent_selection]
    reward_spec = selected_spec.rewards
    return _generate_from_spec(reward_spec)