Esempio n. 1
0
    def __init__(self, max_time_steps, *args, **kwargs):
        super().__init__(*args, **kwargs)
        self.gamma = 0.99
        self.entropy_coefficient = 0.001
        self.value_coefficient = 0.5
        self.max_gradient_norm = 0.5
        self.rms_alpha = 0.99
        self.rms_epsilon = 0.1

        self.learning_rate = LinearSchedule(7e-4, 1e-10, max_time_steps)

        # Auxiliary config
        self.pc_gamma = 0.9
        self.pc_weight = 0.05

        self.vr_weight = 1.0
        self.rp_weight = 1.0

        # Must be initialized in child class
        self.num_processes = None
        self.num_steps = None
        self.env = None

        def not_initialized(*args, **kwargs):
            raise Exception('Not initialized')
        self._train = self._step = self._value = not_initialized
Esempio n. 2
0
    def __init__(self, max_time_steps, *args, **kwargs):
        super().__init__(*args, **kwargs)
        self.gamma = 0.99
        self.entropy_coefficient = 0.001
        self.value_coefficient = 0.25
        self.max_gradient_norm = 0.5

        self.learning_rate = 2e-4
        self.clip_param = 0.1
        self.ppo_epochs = 4
        self.num_minibatches = 4
        self.gae_lambda = 0.95

        self.learning_rate = LinearSchedule(2e-4, 1e-10, max_time_steps)

        # Auxiliary config
        self.pc_gamma = 0.9
        self.pc_weight = 0.0125

        self.vr_weight = 0.0
        self.rp_weight = 0.25

        # Must be initialized in child class
        self.num_processes = None
        self.num_steps = None
        self.env = None

        def not_initialized(*args, **kwargs):
            raise Exception('Not initialized')

        self._train = self._step = self._value = not_initialized
Esempio n. 3
0
 def __init__(self, *args, **kwargs):
     super().__init__(*args, **kwargs)
     self.num_processes = 16
     self.max_gradient_norm = 0.5
     self.rms_alpha = 0.99
     self.rms_epsilon = 1e-5
     self.num_steps = 20
     self.gamma = .99
     self.allow_gpu = True
     self.learning_rate = LinearSchedule(7e-4, 0, self.max_time_steps)
    def __init__(self, *args, **kwargs):
        super().__init__(*args, **kwargs)
        self.num_processes = 16
        self.max_gradient_norm = 0.5
        self.rms_alpha = 0.99
        self.rms_epsilon = 1e-5
        self.num_steps = 20
        self.gamma = .99
        self.allow_gpu = True
        self.learning_rate = LinearSchedule(7e-4, 0, self.max_time_steps)

        self.rp_weight = 1.0
        self.pc_weight = 0.05
        self.vr_weight = 1.0
        self.auxiliary_weight = 0.1
        #self.pc_cell_size =

        self.scene_complexity = MultistepSchedule(
            0.3, [(5000000, LinearSchedule(0.3, 1.0, 5000000)),
                  (10000000, 1.0)])