示例#1
0
文件: a2c.py 项目: vittorione94/tonic
 def __init__(
     self, model=None, replay=None, actor_updater=None, critic_updater=None
 ):
     """Store the agent's components, building a default for each omitted one.

     Args:
         model: Model to use; ``default_model()`` is called when None.
         replay: Replay to use; ``replays.Segment()`` is built when None.
         actor_updater: Actor updater to use;
             ``updaters.StochasticPolicyGradient()`` is built when None.
         critic_updater: Critic updater to use; ``updaters.VRegression()``
             is built when None.
     """
     # Compare against None explicitly instead of relying on truthiness:
     # a caller-supplied object that happens to be falsy (e.g. one that
     # defines __len__ or __bool__) must not be silently swapped for a
     # default.
     if model is None:
         model = default_model()
     if replay is None:
         replay = replays.Segment()
     if actor_updater is None:
         actor_updater = updaters.StochasticPolicyGradient()
     if critic_updater is None:
         critic_updater = updaters.VRegression()

     self.model = model
     self.replay = replay
     self.actor_updater = actor_updater
     self.critic_updater = critic_updater
示例#2
0
文件: a2c.py 项目: seanahmad/tonic
def default_replay():
    """Return a new ``replays.Segment`` configured with this module's defaults."""
    settings = dict(
        size=4096,
        batch_iterations=80,
        batch_size=None,
        discount_factor=0.98,
        trace_decay=0.97,
    )
    return replays.Segment(**settings)