Exemple #1
0
 def rollout(self, timestep_limit, add_noise=True):
     """Run a single rollout of this object's policy in its environment.

     Delegates to ``policies.rollout``, passing ``self.policy`` and
     ``self.env`` positionally and forwarding the two arguments below
     by keyword.

     Args:
         timestep_limit: Forwarded unchanged as ``timestep_limit``
             (presumably the maximum number of environment steps;
             confirm against ``policies.rollout``).
         add_noise: Forwarded unchanged as ``add_noise``. Defaults to
             ``True``.

     Returns:
         A 2-tuple holding the two values produced by
         ``policies.rollout``, in the order it produced them (rewards
         first, then length).
     """
     outcome = policies.rollout(
         self.policy, self.env,
         timestep_limit=timestep_limit, add_noise=add_noise)
     # Unpack explicitly so a result that is not exactly two items fails
     # here, and so the caller always receives a tuple.
     rewards, length = outcome
     return rewards, length
Exemple #2
0
 def rollout(self, timestep_limit, add_noise=True):
     """Perform one rollout using the stored policy and environment.

     This is a thin wrapper: the work is done by ``policies.rollout``,
     which receives ``self.policy`` and ``self.env`` as positional
     arguments plus the keyword arguments described below.

     Args:
         timestep_limit: Passed through as the ``timestep_limit``
             keyword (presumably a cap on steps per rollout; verify
             against ``policies.rollout``).
         add_noise: Passed through as the ``add_noise`` keyword.
             Defaults to ``True``.

     Returns:
         A ``(rewards, length)`` tuple built from the two values that
         ``policies.rollout`` returns.
     """
     policy, env = self.policy, self.env
     # Two-target unpacking keeps the "exactly two results" requirement
     # and normalizes the return value to a tuple.
     rewards, length = policies.rollout(
         policy,
         env,
         timestep_limit=timestep_limit,
         add_noise=add_noise,
     )
     return rewards, length