Пример #1
0
    def __init__(
        self,
        action_selector: ActionSelector,
        action_space: list,
        mu: float = 0.0,
        theta: float = 0.15,
        max_sigma: float = 0.3,
        min_sigma: float = 0.3,
        decay_period: int = 100000,
    ):
        """Wrap ``action_selector`` and record the noise hyper-parameters.

        Args:
            action_selector: Selector being wrapped. Its ``use_cuda``,
                ``action_min``, ``action_max`` and ``action_dim`` attributes
                are read here.
            action_space: Not used by this constructor.
            mu: Stored as ``self.mu``.
            theta: Stored as ``self.theta``.
            max_sigma: Stored as ``self.max_sigma``; also the initial value
                of ``self.sigma``.
            min_sigma: Stored as ``self.min_sigma``.
            decay_period: Stored as ``self.decay_period``.

        NOTE(review): mu/theta/sigma look like Ornstein-Uhlenbeck process
        parameters, with sigma decayed over ``decay_period`` -- confirm
        against the methods that consume them.
        """
        wrapped = action_selector
        ActionSelector.__init__(self, wrapped.use_cuda)
        self.action_selector = wrapped

        # Mirror the wrapped selector's description of the action space.
        self.action_min, self.action_max = wrapped.action_min, wrapped.action_max
        self.action_dim = wrapped.action_dim

        # Noise hyper-parameters; sigma starts out at its maximum value.
        self.mu, self.theta = mu, theta
        self.max_sigma, self.min_sigma = max_sigma, min_sigma
        self.sigma = max_sigma
        self.decay_period = decay_period

        self.exploration = True

        # Kept last: _reset() is defined outside this block and may rely on
        # the attributes assigned above.
        self._reset()
Пример #2
0
 def __init__(self,
              action_selector: ActionSelector,
              max_exploratory_steps: int = 1000):
     """Wrap ``action_selector`` and record the exploratory step limit.

     Args:
         action_selector: Selector being wrapped. Its ``use_cuda`` flag is
             forwarded to ``ActionSelector.__init__`` and its
             ``exploration`` attribute is copied onto this instance.
         max_exploratory_steps: Stored as ``self.max_exploratory_steps``.
     """
     wrapped = action_selector
     ActionSelector.__init__(self, wrapped.use_cuda)
     self.action_selector = wrapped
     # Start with the same exploration setting as the wrapped selector.
     self.exploration = wrapped.exploration
     self.max_exploratory_steps = max_exploratory_steps
Пример #3
0
    def __init__(self, action_selector: ActionSelector, mu: float,
                 sigma: float):
        """Wrap ``action_selector`` and store the ``mu`` / ``sigma`` values.

        Args:
            action_selector: Selector being wrapped. Its ``use_cuda``,
                ``action_min``, ``action_max`` and ``action_dim`` attributes
                are read here.
            mu: Stored as ``self.mu``.
            sigma: Stored as ``self.sigma``.

        NOTE(review): mu/sigma are presumably the mean and standard
        deviation of the exploration noise -- confirm against the code that
        samples with them.
        """
        wrapped = action_selector
        ActionSelector.__init__(self, wrapped.use_cuda)
        self.action_selector = wrapped

        # Mirror the wrapped selector's description of the action space.
        self.action_min, self.action_max = wrapped.action_min, wrapped.action_max
        self.action_dim = wrapped.action_dim

        self.mu, self.sigma = mu, sigma
        self.exploration = True
Пример #4
0
 def __init__(
     self,
     action_selector: ActionSelector,
     action_space: spaces.Discrete,
     hyper_params: DictConfig,
 ):
     """Wrap ``action_selector`` and derive the epsilon schedule values.

     Args:
         action_selector: Selector being wrapped; its ``use_cuda`` flag is
             forwarded to ``ActionSelector.__init__``.
         action_space: Stored as ``self.action_space``.
         hyper_params: Configuration object providing ``eps``,
             ``eps_final`` and ``max_exploration_frame``.

     Raises:
         ZeroDivisionError: If ``hyper_params.max_exploration_frame`` is a
             numeric zero.
     """
     ActionSelector.__init__(self, action_selector.use_cuda)
     self.action_selector = action_selector
     self.action_space = action_space

     eps_start = hyper_params.eps
     eps_end = hyper_params.eps_final
     self.eps = eps_start
     self.eps_final = eps_end
     # Size of one equal step when going from eps to eps_final over
     # max_exploration_frame steps; how it is applied is not visible here.
     eps_span = eps_start - eps_end
     self.eps_decay = eps_span / hyper_params.max_exploration_frame
Пример #5
0
 def __init__(self, device: str):
     """Initialise the selector by forwarding ``device`` to the base class.

     Args:
         device: Passed unchanged as the single argument of
             ``ActionSelector.__init__``.
     """
     ActionSelector.__init__(self, device)
Пример #6
0
 def __init__(self, action_dim: int, action_range: list, use_cuda: bool):
     """Store the action dimensionality and its lower/upper bounds.

     Args:
         action_dim: Stored as ``self.action_dim``.
         action_range: Indexable container; element 0 becomes
             ``self.action_min`` and element 1 becomes ``self.action_max``,
             each converted with ``np.array``.
         use_cuda: Forwarded to ``ActionSelector.__init__``.
     """
     ActionSelector.__init__(self, use_cuda)
     self.action_dim = action_dim
     lower, upper = action_range[0], action_range[1]
     # np.array copies its input, so the stored bounds do not alias the
     # caller's data.
     self.action_min = np.array(lower)
     self.action_max = np.array(upper)
Пример #7
0
 def __init__(self, use_cuda: bool):
     """Initialise the selector by forwarding ``use_cuda`` to the base class.

     Args:
         use_cuda: Passed unchanged as the single argument of
             ``ActionSelector.__init__``.
     """
     ActionSelector.__init__(self, use_cuda)