def rollout(self, timestep_limit, add_noise=False):
    """Run one rollout through ``policies.rollout`` and return its results.

    The call is made with this object's ``policy`` and ``env`` attributes,
    and the ``'offset'`` entry of ``self.config`` is passed as ``offset``.

    Args:
        timestep_limit: Forwarded unchanged as the ``timestep_limit``
            keyword of ``policies.rollout``.
        add_noise: Forwarded unchanged as the ``add_noise`` keyword of
            ``policies.rollout``. Defaults to ``False``.

    Returns:
        A 2-tuple ``(rollout_rewards, rollout_length)`` holding the two
        values produced by ``policies.rollout``, in that order.
    """
    outcome = policies.rollout(
        self.policy,
        self.env,
        timestep_limit=timestep_limit,
        add_noise=add_noise,
        offset=self.config['offset'],
    )
    # Unpack explicitly so a result that is not exactly two items still
    # fails here, and the caller always receives a plain tuple.
    rewards, length = outcome
    return rewards, length