def __init__(self, env_name, rand_seed, misc_info): super(env, self).__init__(env_name, rand_seed, misc_info) self._base_path = init_path.get_abs_base_dir() self._use_pets_reward = 'pets' in misc_info and misc_info['pets'] self._len_qpos, self._len_qvel = \ env_util.get_gym_q_info(self._env, self._current_version) self._done_counter = -1 # return the reset as the gym? if 'reset_type' in misc_info and misc_info['reset_type'] == 'gym': self._reset_return_obs_only = True self.observation_space, self.action_space = \ self._env.observation_space, self._env.action_space # it's possible some environments have different obs self.observation_space = \ env_util.box(self._env_info['ob_size'], -1, 1) else: self._reset_return_obs_only = False if 'no_termination' in misc_info and misc_info['no_termination']: self._no_termination = True else: self._no_termination = False
def __init__(self, env_name, rand_seed, misc_info): super(env, self).__init__(env_name, rand_seed, misc_info) self._base_path = init_path.get_abs_base_dir() self._use_pets_reward = 'pets' in misc_info and misc_info['pets'] self._len_qpos, self._len_qvel = \ env_util.get_gym_q_info(self._env, self._current_version) # return the reset as the gym? if 'reset_type' in misc_info and misc_info['reset_type'] == 'gym': self._reset_return_obs_only = True self.observation_space, self.action_space = \ self._env.observation_space, self._env.action_space # it's possible some environments have different obs self.observation_space = \ env_util.box(self._env_info['ob_size'], -1, 1) else: self._reset_return_obs_only = False if self._env_name == 'gym_cheetahO01': self._action_noise = 0.0 self._ob_noise = 0.1 elif self._env_name == 'gym_cheetahO001': self._action_noise = 0.0 self._ob_noise = 0.01 elif self._env_name == 'gym_cheetahA01': self._action_noise = 0.1 self._ob_noise = 0.0 elif self._env_name == 'gym_cheetahA003': self._action_noise = 0.03 self._ob_noise = 0.0
def __init__(self, env_name, rand_seed, misc_info): super(env, self).__init__(env_name, rand_seed, misc_info) self._base_path = init_path.get_abs_base_dir() # return the reset as the gym? if 'reset_type' in misc_info and misc_info['reset_type'] == 'gym': self._reset_return_obs_only = True self.observation_space, self.action_space = \ self._env.observation_space, self._env.action_space # it's possible some environments have different obs self.observation_space = \ env_util.box(self._env_info['ob_size'], -1, 1) else: self._reset_return_obs_only = False
def __init__(self, env_name, rand_seed, misc_info): assert env_name in ['gym_humanoid', 'gym_slimhumanoid', 'gym_nostopslimhumanoid'] super(env, self).__init__(env_name, rand_seed, misc_info) self._base_path = init_path.get_abs_base_dir() self._len_qpos, self._len_qvel = \ env_util.get_gym_q_info(self._env, self._current_version) # return the reset as the gym? if 'reset_type' in misc_info and misc_info['reset_type'] == 'gym': self._reset_return_obs_only = True self.observation_space, self.action_space = \ self._env.observation_space, self._env.action_space # it's possible some environments have different obs self.observation_space = \ env_util.box(self._env_info['ob_size'], -1, 1) else: self._reset_return_obs_only = False
def __init__(self, env_name, rand_seed, misc_info): super(env, self).__init__(env_name, rand_seed, misc_info) self._base_path = init_path.get_abs_base_dir() # return the reset as the gym? if 'reset_type' in misc_info and misc_info['reset_type'] == 'gym': self._reset_return_obs_only = True self.observation_space, self.action_space = \ self._env.observation_space, self._env.action_space # it's possible some environments have different obs self.action_space = spaces.Box( low=np.array([-1.0]), high=np.array([1.0]), # dtype=np.float32 ) self.observation_space = \ env_util.box(self._env_info['ob_size'], -1, 1) else: self._reset_return_obs_only = False if self._env_name == 'gym_cartpoleO001': self._ob_noise = 0.01 elif self._env_name == 'gym_cartpoleO01': self._ob_noise = 0.1
def __init__(self, env_name, rand_seed, misc_info): super(env, self).__init__(env_name, rand_seed, misc_info) self._base_path = init_path.get_abs_base_dir() # return the reset as the gym? if 'reset_type' in misc_info and misc_info['reset_type'] == 'gym': self._reset_return_obs_only = True self.observation_space, self.action_space = \ self._env.observation_space, self._env.action_space # it's possible some environments have different obs self.observation_space = \ env_util.box(self._env_info['ob_size'], -1, 1) # note: we always set the action to range with in [-1, 1] self.action_space.low[:] = -1.0 self.action_space.high[:] = 1.0 else: self._reset_return_obs_only = False if self._env_name == 'gym_pendulumO001': self._ob_noise = 0.01 elif self._env_name == 'gym_pendulumO01': self._ob_noise = 0.1