def update_eps(self, p_id, update_nr):
    """Recompute and store the epsilon value kept for ``p_id``.

    The new value is whatever ``rl_util.polynomial_decay`` returns for the
    schedule parameters found on ``self._args.ddqn_args`` (``eps_start``,
    ``eps_min``, ``eps_const``, ``eps_exponent``), evaluated with
    ``update_nr`` as the counter.

    Args:
        p_id: Key/index into ``self._eps`` whose entry is overwritten.
        update_nr: Counter value handed to the decay schedule.

    Returns:
        None. The result is written to ``self._eps[p_id]``.
    """
    schedule = self._args.ddqn_args
    decayed = rl_util.polynomial_decay(
        base=schedule.eps_start,
        minimum=schedule.eps_min,
        const=schedule.eps_const,
        exponent=schedule.eps_exponent,
        counter=update_nr,
    )
    self._eps[p_id] = decayed
def increment(self):
    """Advance the iteration counter and refresh the decayed schedules.

    Adds one to ``self.global_iter_id`` and then recomputes ``self.eps``
    (from ``self.ddqn_args``) and ``self.antic`` (from ``self._t_prof``)
    via ``rl_util.polynomial_decay``, using the updated counter. Whenever
    the counter is a multiple of 1000, ``self._log_eps()`` and
    ``self._log_antic()`` are called.

    Returns:
        The value of ``self.seat_id``.
    """
    self.global_iter_id += 1
    step = self.global_iter_id

    eps_cfg = self.ddqn_args
    self.eps = rl_util.polynomial_decay(
        base=eps_cfg.eps_start,
        const=eps_cfg.eps_const,
        exponent=eps_cfg.eps_exponent,
        minimum=eps_cfg.eps_min,
        counter=step,
    )

    antic_cfg = self._t_prof
    self.antic = rl_util.polynomial_decay(
        base=antic_cfg.antic_start,
        const=antic_cfg.antic_const,
        exponent=antic_cfg.antic_exponent,
        minimum=antic_cfg.antic_min,
        counter=step,
    )

    # Only emit the log entries on every 1000th iteration.
    log_due = step % 1000 == 0
    if log_due:
        self._log_eps()
        self._log_antic()

    return self.seat_id