Exemple #1
0
def load(noise_scale, seed):
    """Build a noisy SimpleBandit environment for the bandit_noise experiment.

    Args:
      noise_scale: forwarded to ``wrappers.RewardNoise`` as ``noise_scale``.
      seed: passed to both the underlying ``bandit.SimpleBandit`` and the
        ``wrappers.RewardNoise`` wrapper.

    Returns:
      The wrapped environment, with ``bsuite_num_episodes`` set to
      ``sweep.NUM_EPISODES``.
    """
    base_env = bandit.SimpleBandit(seed=seed)
    noisy_env = wrappers.RewardNoise(
        env=base_env,
        noise_scale=noise_scale,
        seed=seed,
    )
    # Record the episode budget on the environment object itself.
    noisy_env.bsuite_num_episodes = sweep.NUM_EPISODES
    return noisy_env
Exemple #2
0
def load(mean_rewards=None, seed=None):
    """Build a SimpleBandit environment wrapped with ``bernoulli=True`` noise.

    Args:
      mean_rewards: forwarded to ``bandit.SimpleBandit`` as ``rewards``.
      seed: passed to both the underlying ``bandit.SimpleBandit`` and the
        ``wrappers.RewardNoise`` wrapper.

    Returns:
      The wrapped environment, with ``bsuite_num_episodes`` set to
      ``sweep.NUM_EPISODES``.
    """
    base_env = bandit.SimpleBandit(rewards=mean_rewards, seed=seed)
    noisy_env = wrappers.RewardNoise(
        env=base_env,
        bernoulli=True,
        seed=seed,
    )
    # Record the episode budget on the environment object itself.
    noisy_env.bsuite_num_episodes = sweep.NUM_EPISODES
    return noisy_env
Exemple #3
0
 def make_object_under_test(self):
     """Return a fresh ``bandit.SimpleBandit`` built with the argument ``5``.

     NOTE(review): ``5`` is passed positionally; presumably it is the seed,
     but the constructor signature is not visible here -- confirm.
     """
     environment = bandit.SimpleBandit(5)
     return environment
Exemple #4
0
 def make_object_under_test(self):
     """Return a fresh ``bandit.SimpleBandit`` with three rewards and seed 5."""
     rewards = [0.1, 0.3, 0.7]
     environment = bandit.SimpleBandit(rewards=rewards, seed=5)
     return environment