def __init__(self, args, env):
    """Set up the agent, HER sampler, replay buffer and rollout worker.

    Args:
        args: Configuration object. ``noise_eps``, ``epsilon``,
            ``replay_strategy`` and ``replay_k`` are read from it here, and
            the whole object is forwarded to ``Agent``, ``Buffer`` and
            ``RolloutWorker``.
        env: Environment instance. Its ``compute_reward`` attribute is
            handed to ``HerSampler``.
    """
    # Plain configuration values.
    self.args = args
    self.env = env
    self.noise = args.noise_eps
    self.epsilon = args.epsilon

    # Collaborators: the buffer needs the sampler's sampling function and
    # the worker needs the agent, so they are built in dependency order.
    self.agent = Agent(args)
    self.her_module = HerSampler(
        args.replay_strategy,
        args.replay_k,
        env.compute_reward,
    )
    sample_fn = self.her_module.sample_her_transitions
    self.buffer = Buffer(args, sample_fn)
    self.worker = RolloutWorker(self.env, self.agent, args)
def __init__(self, args, env):
    """Store run settings, build agents and buffer, and ensure the save dir.

    Args:
        args: Configuration object. ``noise_rate``, ``epsilon``,
            ``max_episode_len``, ``save_dir`` and ``scenario_name`` are read
            from it here, and the whole object is forwarded to ``Buffer``.
        env: Environment instance, stored on ``self.env``.

    Raises:
        OSError: If the save directory cannot be created (for example, the
            path already exists but is not a directory).
    """
    self.args = args
    self.noise = args.noise_rate
    self.epsilon = args.epsilon
    self.episode_limit = args.max_episode_len
    self.env = env
    # _init_agents() runs only after args/env are stored on self.
    self.agents = self._init_agents()
    self.buffer = Buffer(args)

    # Keep the exact '<save_dir>/<scenario_name>' string form in case other
    # code builds on this attribute.
    self.save_path = self.args.save_dir + '/' + self.args.scenario_name
    # exist_ok=True avoids the check-then-create race of a separate
    # os.path.exists() test when several runs start at the same time.
    os.makedirs(self.save_path, exist_ok=True)