def __init__(self, name, pars, nrenvs=1, job=None, experiment=None):
    """Set up the base ``Agent`` and attach fixed training hyperparameters.

    All five arguments are forwarded, unchanged and positionally, to
    ``Agent.__init__``; this constructor does not read them itself.

    Args:
        name: Forwarded to ``Agent.__init__``.
        pars: Forwarded to ``Agent.__init__``.
        nrenvs: Forwarded to ``Agent.__init__`` (defaults to 1).
        job: Forwarded to ``Agent.__init__`` (defaults to ``None``).
        experiment: Forwarded to ``Agent.__init__`` (defaults to ``None``).
    """
    Agent.__init__(self, name, pars, nrenvs, job, experiment)

    # Hard-coded constants; none of them is taken from ``pars``.
    # NOTE(review): the names suggest PPO settings (value-loss weight,
    # update epochs, ratio clip, gradient-norm cap) -- confirm against the
    # training code that consumes them.
    self.coef_value = 0.5
    self.ppo_steps = 5
    self.clip_param = 0.2
    self.max_grad_norm = 0.5
    self.eps_threshold = 0.1
    self.use_clipped_value_loss = True
def __init__(self, name, pars, nrenvs=1, job=None, experiment=None):
    """Set up the base ``Agent`` and then call ``reset_hx()``.

    All five arguments are forwarded, unchanged and positionally, to
    ``Agent.__init__``; this constructor does not read them itself.

    Args:
        name: Forwarded to ``Agent.__init__``.
        pars: Forwarded to ``Agent.__init__``.
        nrenvs: Forwarded to ``Agent.__init__`` (defaults to 1).
        job: Forwarded to ``Agent.__init__`` (defaults to ``None``).
        experiment: Forwarded to ``Agent.__init__`` (defaults to ``None``).
    """
    Agent.__init__(self, name, pars, nrenvs, job, experiment)

    # Runs only after the base initialiser has finished.
    # NOTE(review): reset_hx is defined outside this block; presumably it
    # (re)creates the recurrent hidden state -- confirm.
    self.reset_hx()
def __init__(self, name, pars, nrenvs=1, job=None, experiment=None):
    """Set up the base ``Agent`` and set ``coef_value`` to 0.5.

    All five arguments are forwarded, unchanged and positionally, to
    ``Agent.__init__``; this constructor does not read them itself.

    Args:
        name: Forwarded to ``Agent.__init__``.
        pars: Forwarded to ``Agent.__init__``.
        nrenvs: Forwarded to ``Agent.__init__`` (defaults to 1).
        job: Forwarded to ``Agent.__init__`` (defaults to ``None``).
        experiment: Forwarded to ``Agent.__init__`` (defaults to ``None``).
    """
    Agent.__init__(self, name, pars, nrenvs, job, experiment)

    # Hard-coded constant, not taken from ``pars``.
    # NOTE(review): presumably the weight of a value-loss term -- confirm
    # where it is consumed.
    self.coef_value = 0.5
def __init__(self, name, pars, nrenvs=1, job=None, experiment=None):
    """Set up the base ``Agent`` and allocate two zero-filled state tensors.

    After the base initialiser runs, ``self.h2`` and ``self.h1`` are each
    created as a zero tensor of shape ``(1, 1, pars['en'])`` on
    ``self.device``, and ``self.rnnB`` is set to 10.

    Args:
        name: Forwarded to ``Agent.__init__``.
        pars: Forwarded to ``Agent.__init__``; its ``'en'`` entry also
            gives the size of the last dimension of ``h1``/``h2``.
        nrenvs: Forwarded to ``Agent.__init__`` (defaults to 1).
        job: Forwarded to ``Agent.__init__`` (defaults to ``None``).
        experiment: Forwarded to ``Agent.__init__`` (defaults to ``None``).
    """
    Agent.__init__(self, name, pars, nrenvs, job, experiment)

    # ``self.device`` is not assigned in this block.
    # NOTE(review): presumably provided by Agent.__init__ -- confirm.
    batch_size = 1
    state_shape = (1, batch_size, pars['en'])

    # NOTE(review): the names suggest RNN hidden states laid out as
    # (layers, batch, features) -- confirm against the network that uses them.
    self.h2 = torch.zeros(state_shape, device=self.device)
    self.h1 = torch.zeros(state_shape, device=self.device)

    # Hard-coded constant; its meaning is not visible from this block.
    self.rnnB = 10