def create_majority_step_swarm(): swarm = StepSwarm( model=lambda x: DiscreteUniform(env=x), env=cartpole_env, reward_limit=10, n_walkers=100, max_epochs=20, step_epochs=25, ) return swarm
def create_majority_step_swarm(): swarm = StepSwarm( model=lambda x: DiscreteUniform(env=x), env=lambda: ParallelEnvironment(lambda: DiscreteEnv(ClassicControl())), reward_limit=10, n_walkers=100, max_epochs=20, step_epochs=25, ) return swarm
def create_follow_best_step_swarm(): swarm = StepSwarm( root_model=FollowBestModel, model=lambda x: DiscreteUniform(env=x), env=cartpole_env, reward_limit=101, n_walkers=100, max_epochs=200, step_epochs=10, ) return swarm
def create_follow_best_step_swarm(): swarm = StepSwarm( root_model=FollowBestModel, model=lambda x: DiscreteUniform(env=x), env=lambda: ParallelEnvironment(lambda: DiscreteEnv(ClassicControl())), reward_limit=15, n_walkers=100, max_epochs=15, step_epochs=25, ) return swarm
def create_follow_best_step_swarm_after_impr(): swarm = StepSwarm( root_model=FollowBestModel, model=lambda x: DiscreteUniform(env=x), env=cartpole_env, reward_limit=101, n_walkers=10, # 0, max_epochs=2, # 200, step_epochs=2, # 5, step_after_improvement=True, ) return swarm
def create_follow_best_step_swarm_after_impr(): swarm = StepSwarm( root_model=FollowBestModel, model=lambda x: DiscreteUniform(env=x), env=lambda: ParallelEnv(lambda: DiscreteEnv( ClassicControl("CartPole-v0"))), reward_limit=101, n_walkers=100, max_epochs=200, step_epochs=25, step_after_improvement=True, ) return swarm