def __init__(
    self, model=None, replay=None, actor_updater=None, critic_updater=None
):
    """Store the four components, building a default for each one omitted.

    Args:
        model: Stored as ``self.model``. ``None`` selects the result of
            ``default_model()``.
        replay: Stored as ``self.replay``. ``None`` selects
            ``replays.Segment()`` constructed with no arguments.
        actor_updater: Stored as ``self.actor_updater``. ``None`` selects
            ``updaters.StochasticPolicyGradient()``.
        critic_updater: Stored as ``self.critic_updater``. ``None`` selects
            ``updaters.VRegression()``.
    """
    # Test against None instead of relying on truthiness: a caller-supplied
    # component that happens to be falsy (for example a container-like object
    # whose __len__ is currently 0) must not be silently swapped for a default.
    self.model = default_model() if model is None else model

    # NOTE(review): this file also defines default_replay(), which passes
    # explicit settings to replays.Segment; the fallback here uses Segment's
    # own defaults instead. Confirm which one is intended.
    self.replay = replays.Segment() if replay is None else replay

    self.actor_updater = (
        updaters.StochasticPolicyGradient()
        if actor_updater is None
        else actor_updater
    )
    self.critic_updater = (
        updaters.VRegression() if critic_updater is None else critic_updater
    )
def default_replay():
    """Return a ``replays.Segment`` built with this module's preset settings.

    The five keyword arguments below are passed to the constructor unchanged;
    what each one controls is defined by ``replays.Segment`` itself.
    """
    settings = {
        "size": 4096,
        "batch_iterations": 80,
        "batch_size": None,
        "discount_factor": 0.98,
        "trace_decay": 0.97,
    }
    return replays.Segment(**settings)