Beispiel #1
0
 def rollout(self, timestep_limit, add_noise=False):
     """Run one rollout through ``policies.rollout`` and return its result.

     The call is made with this object's ``policy`` and ``env`` plus the
     ``'offset'`` entry of ``self.config``.

     Args:
         timestep_limit: Forwarded unchanged as ``timestep_limit``.
         add_noise: Forwarded unchanged as ``add_noise`` (default False).

     Returns:
         A 2-tuple with the two values produced by ``policies.rollout``
         (presumably the per-step rewards and the episode length --
         confirm against ``policies.rollout``).
     """
     # Unpack explicitly so that a result that is not exactly a pair
     # fails here rather than being passed on to the caller.
     rewards, length = policies.rollout(
         self.policy, self.env,
         timestep_limit=timestep_limit, add_noise=add_noise,
         offset=self.config['offset'],
     )
     return rewards, length
Beispiel #2
0
 def rollout(self, timestep_limit, add_noise=False):
     """Run one rollout through ``policies.rollout`` and return its result.

     The call is made with this object's ``policy`` and ``env`` plus the
     ``'offset'`` entry of ``self.config``.

     Args:
         timestep_limit: Forwarded unchanged as ``timestep_limit``.
         add_noise: Forwarded unchanged as ``add_noise`` (default False).

     Returns:
         A 2-tuple with the two values produced by ``policies.rollout``
         (presumably the per-step rewards and the episode length --
         confirm against ``policies.rollout``).
     """
     # Unpack explicitly so that a result that is not exactly a pair
     # fails here rather than being passed on to the caller.
     rewards, length = policies.rollout(
         self.policy, self.env,
         timestep_limit=timestep_limit, add_noise=add_noise,
         offset=self.config['offset'],
     )
     return rewards, length