def rollout(self, timestep_limit, add_noise=True):
    """Run one rollout by delegating to ``policies.rollout``.

    This object's ``policy`` and ``env`` attributes are handed to the
    helper together with the caller-supplied options.

    Args:
        timestep_limit: Forwarded unchanged as the helper's
            ``timestep_limit`` keyword argument.
        add_noise: Forwarded unchanged as the helper's ``add_noise``
            keyword argument. Defaults to ``True``.

    Returns:
        A 2-tuple ``(rollout_rewards, rollout_length)`` holding the two
        values produced by ``policies.rollout``, in that order.
    """
    outcome = policies.rollout(
        self.policy,
        self.env,
        timestep_limit=timestep_limit,
        add_noise=add_noise,
    )
    # Unpack explicitly so the helper's result must contain exactly two
    # items and the caller always receives a plain tuple.
    rewards, length = outcome
    return rewards, length