Ejemplo n.º 1
0
 def __init__(
     self, model=None, replay=None, actor_updater=None, critic_updater=None
 ):
     """Store the four components, building a default for each omitted one.

     Args:
         model: Object stored as ``self.model``. When ``None``,
             ``default_model()`` is used.
         replay: Object stored as ``self.replay``. When ``None``,
             ``replays.Segment()`` is used.
         actor_updater: Object stored as ``self.actor_updater``. When
             ``None``, ``updaters.StochasticPolicyGradient()`` is used.
         critic_updater: Object stored as ``self.critic_updater``. When
             ``None``, ``updaters.VRegression()`` is used.
     """
     # Compare against None explicitly instead of relying on truthiness:
     # a caller-supplied object that happens to be falsy (for example one
     # defining __len__ or __bool__) must be kept, not silently swapped
     # for a default.
     if model is None:
         model = default_model()
     if replay is None:
         replay = replays.Segment()
     if actor_updater is None:
         actor_updater = updaters.StochasticPolicyGradient()
     if critic_updater is None:
         critic_updater = updaters.VRegression()

     self.model = model
     self.replay = replay
     self.actor_updater = actor_updater
     self.critic_updater = critic_updater
Ejemplo n.º 2
0
def default_replay():
    """Build the default replay object.

    Returns:
        The result of calling ``replays.Segment`` with ``size=4096``,
        ``batch_iterations=80``, ``batch_size=None``,
        ``discount_factor=0.98`` and ``trace_decay=0.97``.
    """
    # Keep the settings in one mapping so they can be read at a glance;
    # they are forwarded unchanged as keyword arguments.
    settings = {
        "size": 4096,
        "batch_iterations": 80,
        "batch_size": None,
        "discount_factor": 0.98,
        "trace_decay": 0.97,
    }
    return replays.Segment(**settings)