def update_eps(self, p_id, update_nr):
    """Recompute and store the epsilon value kept for ``p_id``.

    The new value comes from ``rl_util.polynomial_decay``, fed with the
    ``eps_start`` / ``eps_min`` / ``eps_const`` / ``eps_exponent`` settings
    found on ``self._args.ddqn_args`` and with ``update_nr`` as the counter.

    Args:
        p_id: Key under which the value is written into ``self._eps``.
            NOTE(review): presumably a player/seat id -- confirm with caller.
        update_nr: Passed through unchanged as the decay ``counter``.

    Returns:
        None. The result is written to ``self._eps[p_id]``.
    """
    ddqn_cfg = self._args.ddqn_args
    decayed_eps = rl_util.polynomial_decay(
        base=ddqn_cfg.eps_start,
        minimum=ddqn_cfg.eps_min,
        const=ddqn_cfg.eps_const,
        exponent=ddqn_cfg.eps_exponent,
        counter=update_nr,
    )
    self._eps[p_id] = decayed_eps
Esempio n. 2
0
    def increment(self):
        """Advance the iteration counter and refresh the decayed values.

        Steps, in order:
          1. ``self.global_iter_id`` is increased by one.
          2. ``self.eps`` is recomputed via ``rl_util.polynomial_decay`` from
             the ``eps_*`` settings on ``self.ddqn_args``.
          3. ``self.antic`` is recomputed the same way from the ``antic_*``
             settings on ``self._t_prof``.
          4. On every iteration whose id is a multiple of 1000, both
             ``self._log_eps()`` and ``self._log_antic()`` are called.

        Returns:
            The value of ``self.seat_id``.
        """
        self.global_iter_id += 1
        iteration = self.global_iter_id

        eps_cfg = self.ddqn_args
        self.eps = rl_util.polynomial_decay(
            base=eps_cfg.eps_start,
            const=eps_cfg.eps_const,
            exponent=eps_cfg.eps_exponent,
            minimum=eps_cfg.eps_min,
            counter=iteration,
        )

        antic_cfg = self._t_prof
        self.antic = rl_util.polynomial_decay(
            base=antic_cfg.antic_start,
            const=antic_cfg.antic_const,
            exponent=antic_cfg.antic_exponent,
            minimum=antic_cfg.antic_min,
            counter=iteration,
        )

        # Log only on every 1000th iteration.
        is_logging_step = iteration % 1000 == 0
        if is_logging_step:
            self._log_eps()
            self._log_antic()

        return self.seat_id