def batch_generator(buffer: ptan.experience.ExperienceReplayBuffer, initial: int, batch_size: int):
    """Yield an endless stream of batches sampled from ``buffer``.

    Nothing happens until the generator is first advanced. At that point
    ``buffer.populate(initial)`` is called once; afterwards every step calls
    ``buffer.populate(1)`` and then yields ``buffer.sample(batch_size)``.

    Args:
        buffer: Replay buffer providing ``populate`` and ``sample``.
        initial: Argument passed to the one-off ``populate`` call made
            before the first batch.
        batch_size: Argument passed to every ``sample`` call.

    Yields:
        Whatever ``buffer.sample(batch_size)`` returns.
    """
    # One-off warm-up before any batch is produced.
    buffer.populate(initial)
    while True:
        # Request one more entry per batch so the buffer keeps being refreshed.
        buffer.populate(1)
        batch = buffer.sample(batch_size)
        yield batch
def batch_generator(a_exp: ptan.experience.ExperienceSource, b_exp: ptan.experience.ExperienceSource, buffer: ptan.experience.ExperienceReplayBuffer, replay_initial: int, batch_size: int):
    """Feed two experience sources into one buffer and yield sampled batches.

    The two sources are iterated in lockstep with ``zip``, so iteration ends
    as soon as either source is exhausted. For every pair, the entry from
    ``a_exp`` is added to ``buffer`` first and the entry from ``b_exp``
    second. A batch is yielded only once ``len(buffer)`` has reached
    ``replay_initial``.

    Args:
        a_exp: First iterable of experience entries.
        b_exp: Second iterable of experience entries.
        buffer: Replay buffer providing ``_add``, ``__len__`` and ``sample``.
        replay_initial: Minimum buffer length required before batches are
            yielded.
        batch_size: Argument passed to every ``sample`` call.

    Yields:
        Whatever ``buffer.sample(batch_size)`` returns.
    """
    for paired_steps in zip(a_exp, b_exp):
        # Keep the original insertion order: a_exp entry, then b_exp entry.
        for step in paired_steps:
            buffer._add(step)
        # Hold back batches until the buffer has warmed up.
        if len(buffer) >= replay_initial:
            yield buffer.sample(batch_size)
def batch_genartate(buffer: ptan.experience.ExperienceReplayBuffer, size):
    """Yield an endless stream of batches sampled from ``buffer``.

    Every step calls ``buffer.populate(1)`` and then yields
    ``buffer.sample(size)``. There is no separate warm-up call, so the
    buffer is touched for the first time when the generator is first
    advanced.

    Args:
        buffer: Replay buffer providing ``populate`` and ``sample``.
        size: Argument passed to every ``sample`` call.

    Yields:
        Whatever ``buffer.sample(size)`` returns.
    """
    while True:
        # Request one more entry before drawing each batch.
        buffer.populate(1)
        batch = buffer.sample(size)
        yield batch