Example #1
0
def create_majority_step_swarm():
    swarm = StepSwarm(
        model=lambda x: DiscreteUniform(env=x),
        env=cartpole_env,
        reward_limit=10,
        n_walkers=100,
        max_epochs=20,
        step_epochs=25,
    )
    return swarm
Example #2
0
def create_majority_step_swarm():
    swarm = StepSwarm(
        model=lambda x: DiscreteUniform(env=x),
        env=lambda: ParallelEnvironment(lambda: DiscreteEnv(ClassicControl())),
        reward_limit=10,
        n_walkers=100,
        max_epochs=20,
        step_epochs=25,
    )
    return swarm
Example #3
0
def create_follow_best_step_swarm():
    swarm = StepSwarm(
        root_model=FollowBestModel,
        model=lambda x: DiscreteUniform(env=x),
        env=cartpole_env,
        reward_limit=101,
        n_walkers=100,
        max_epochs=200,
        step_epochs=10,
    )
    return swarm
Example #4
0
def create_follow_best_step_swarm():
    swarm = StepSwarm(
        root_model=FollowBestModel,
        model=lambda x: DiscreteUniform(env=x),
        env=lambda: ParallelEnvironment(lambda: DiscreteEnv(ClassicControl())),
        reward_limit=15,
        n_walkers=100,
        max_epochs=15,
        step_epochs=25,
    )
    return swarm
Example #5
0
def create_follow_best_step_swarm_after_impr():
    swarm = StepSwarm(
        root_model=FollowBestModel,
        model=lambda x: DiscreteUniform(env=x),
        env=cartpole_env,
        reward_limit=101,
        n_walkers=10,  # 0,
        max_epochs=2,  # 200,
        step_epochs=2,  # 5,
        step_after_improvement=True,
    )
    return swarm
def create_follow_best_step_swarm_after_impr():
    swarm = StepSwarm(
        root_model=FollowBestModel,
        model=lambda x: DiscreteUniform(env=x),
        env=lambda: ParallelEnv(lambda: DiscreteEnv(
            ClassicControl("CartPole-v0"))),
        reward_limit=101,
        n_walkers=100,
        max_epochs=200,
        step_epochs=25,
        step_after_improvement=True,
    )
    return swarm