def __init__(self, max_time_steps, *args, **kwargs): super().__init__(*args, **kwargs) self.gamma = 0.99 self.entropy_coefficient = 0.001 self.value_coefficient = 0.5 self.max_gradient_norm = 0.5 self.rms_alpha = 0.99 self.rms_epsilon = 0.1 self.learning_rate = LinearSchedule(7e-4, 1e-10, max_time_steps) # Auxiliary config self.pc_gamma = 0.9 self.pc_weight = 0.05 self.vr_weight = 1.0 self.rp_weight = 1.0 # Must be initialized in child class self.num_processes = None self.num_steps = None self.env = None def not_initialized(*args, **kwargs): raise Exception('Not initialized') self._train = self._step = self._value = not_initialized
def __init__(self, max_time_steps, *args, **kwargs): super().__init__(*args, **kwargs) self.gamma = 0.99 self.entropy_coefficient = 0.001 self.value_coefficient = 0.25 self.max_gradient_norm = 0.5 self.learning_rate = 2e-4 self.clip_param = 0.1 self.ppo_epochs = 4 self.num_minibatches = 4 self.gae_lambda = 0.95 self.learning_rate = LinearSchedule(2e-4, 1e-10, max_time_steps) # Auxiliary config self.pc_gamma = 0.9 self.pc_weight = 0.0125 self.vr_weight = 0.0 self.rp_weight = 0.25 # Must be initialized in child class self.num_processes = None self.num_steps = None self.env = None def not_initialized(*args, **kwargs): raise Exception('Not initialized') self._train = self._step = self._value = not_initialized
def __init__(self, *args, **kwargs): super().__init__(*args, **kwargs) self.num_processes = 16 self.max_gradient_norm = 0.5 self.rms_alpha = 0.99 self.rms_epsilon = 1e-5 self.num_steps = 20 self.gamma = .99 self.allow_gpu = True self.learning_rate = LinearSchedule(7e-4, 0, self.max_time_steps)
def __init__(self, *args, **kwargs): super().__init__(*args, **kwargs) self.num_processes = 16 self.max_gradient_norm = 0.5 self.rms_alpha = 0.99 self.rms_epsilon = 1e-5 self.num_steps = 20 self.gamma = .99 self.allow_gpu = True self.learning_rate = LinearSchedule(7e-4, 0, self.max_time_steps) self.rp_weight = 1.0 self.pc_weight = 0.05 self.vr_weight = 1.0 self.auxiliary_weight = 0.1 #self.pc_cell_size = self.scene_complexity = MultistepSchedule( 0.3, [(5000000, LinearSchedule(0.3, 1.0, 5000000)), (10000000, 1.0)])