示例#1
0
    def __init__(self, env: gym.Env):
        """Initialise instance state around ``env``.

        Args:
            env: Environment passed through ``utils.torchenv``; the value
                returned by that helper is what gets stored on ``self.env``.
        """
        wrapped_env = utils.torchenv(env)
        self.env = wrapped_env
        # Starts empty; presumably collects one reward total per episode
        # (inferred from the name -- confirm against the training loop).
        self.ep_rewards: List[float] = []

        # Two separate optimizer instances, each built over an empty
        # parameter list. NOTE(review): these look like placeholders that
        # are replaced before training -- confirm.
        self.actor_optimizer = Adam([])
        self.critic_optimizer = Adam([])
        # NOTE(review): the meaning of the ``1`` argument is not visible here.
        self.replay: Replay = NoReplay(1)
示例#2
0
文件: dqn.py 项目: fkodom/metis
    def __init__(self, env: gym.Env):
        """Initialise instance state around ``env``.

        Args:
            env: Environment passed through ``utils.torchenv``; the value
                returned by that helper is what gets stored on ``self.env``.
        """
        self.env = utils.torchenv(env)
        # Starts empty; presumably one entry per episode (confirm).
        self.ep_rewards = []

        # Nothing is constructed here: the replay buffer, optimizer and
        # target network attributes all begin as ``None``. Targets are bound
        # left to right, matching the order replay -> optimizer -> target_dqn.
        self.replay = self.optimizer = self.target_dqn = None
示例#3
0
    def __init__(self, env: gym.Env):
        """Initialise instance state around ``env``.

        Args:
            env: Environment passed through ``utils.torchenv``; the value
                returned by that helper is what gets stored on ``self.env``.
        """
        wrapped_env = utils.torchenv(env)
        self.env = wrapped_env
        # Reward bookkeeping: an empty history list and a running average
        # that starts at zero. How the average is updated is not shown here.
        self.ep_rewards: List[float] = []
        self.avg_reward = 0.0

        # Optimizer built over an empty parameter list. NOTE(review): looks
        # like a placeholder that is replaced before training -- confirm.
        self.optimizer: Optimizer = Adam([])
        # NOTE(review): the meaning of the ``1`` argument is not visible here.
        self.replay: Replay = NoReplay(1)
示例#4
0
    def __init__(self, env: gym.Env):
        """Initialise instance state around ``env``.

        Args:
            env: Environment passed through ``utils.torchenv``; the value
                returned by that helper is what gets stored on ``self.env``.
        """
        self.env = utils.torchenv(env)
        # Starts empty; presumably one entry per episode (confirm).
        self.ep_rewards = []

        # Nothing is constructed here: every training component begins as
        # ``None``. Targets are bound left to right, in the order
        # replay -> critic_optimizer -> actor_optimizer -> target_critics.
        self.replay = (
            self.critic_optimizer
        ) = self.actor_optimizer = self.target_critics = None