def env_fn(**kwargs): env = raw_env(**kwargs) env = wrappers.AssertOutOfBoundsWrapper(env) backup_policy = "taking zero action (no movement, no attack)" env = wrappers.NanNoOpWrapper(env, 0, backup_policy) env = wrappers.OrderEnforcingWrapper(env) return env
def env(**kwargs): env = raw_env(**kwargs) example_space = list(env.action_spaces.values())[0] env = wrappers.AssertOutOfBoundsWrapper(env) env = wrappers.NanNoOpWrapper(env, np.zeros(example_space.shape, dtype=example_space.dtype), "taking all zeros action") env = wrappers.OrderEnforcingWrapper(env) return env
def env(**kwargs): env = raw_env(**kwargs) env = wrappers.TerminateIllegalWrapper(env, illegal_reward=-1) env = wrappers.AssertOutOfBoundsWrapper(env) env = wrappers.NanNoOpWrapper(env, 26**2 * 2, "executing the 'do nothing' action.") env = wrappers.OrderEnforcingWrapper(env) return env
def env(**kwargs): env = raw_env(**kwargs) env = wrappers.AssertOutOfBoundsWrapper(env) default_val = 1 env = wrappers.NanNoOpWrapper(env, default_val, "setting action to 1") env = wrappers.OrderEnforcingWrapper(env) return env
def env(**kwargs): env = raw_env(**kwargs) pass_move = env._N * env._N env = wrappers.TerminateIllegalWrapper(env, illegal_reward=-1) env = wrappers.AssertOutOfBoundsWrapper(env) env = wrappers.NanNoOpWrapper(env, pass_move, "passing turn with action {}".format(pass_move)) env = wrappers.OrderEnforcingWrapper(env) return env
def env(**kwargs): env = raw_env(**kwargs) env = wrappers.TerminateIllegalWrapper(env, illegal_reward=-1) env = wrappers.AssertOutOfBoundsWrapper(env) pass_action = 3 env = wrappers.NanNoOpWrapper(env, pass_action, "'checked' with action {}".format(pass_action)) env = wrappers.OrderEnforcingWrapper(env) return env
def env(**kwargs): env = raw_env(**kwargs) default_val = np.zeros((1, )) if env.continuous else 1 env = wrappers.AssertOutOfBoundsWrapper(env) env = wrappers.NanNoOpWrapper(env, default_val, "setting action to {}".format(default_val)) env = wrappers.OrderEnforcingWrapper(env) return env
def env(**kwargs): env = raw_env(**kwargs) env = wrappers.CaptureStdoutWrapper(env) env = wrappers.TerminateIllegalWrapper(env, illegal_reward=-1) env = wrappers.AssertOutOfBoundsWrapper(env) pass_move = 308 env = wrappers.NanNoOpWrapper(env, pass_move, "passing turn with action number {}".format(pass_move)) env = wrappers.OrderEnforcingWrapper(env) return env
def env(**kwargs): env = raw_env(**kwargs) world = env.world env = wrappers.AssertOutOfBoundsWrapper(env) backup_policy = "taking zero action (no movement, communication 0)" env = wrappers.NanNoOpWrapper(env, 0, backup_policy) env = wrappers.OrderEnforcingWrapper(env) env.world = world return env
def env(**kwargs): env = raw_env(**kwargs) if env.continuous: default_val = np.zeros((1, )) env = wrappers.ClipOutOfBoundsWrapper(env) else: default_val = 0 env = wrappers.AssertOutOfBoundsWrapper(env) env = wrappers.NanNoOpWrapper(env, default_val, "setting action to 0") env = wrappers.OrderEnforcingWrapper(env) return env
def env(**kwargs): env = raw_env(**kwargs) env = wrappers.AssertOutOfBoundsWrapper(env) env = wrappers.NanNoOpWrapper(env, 0, "doing nothing") env = wrappers.OrderEnforcingWrapper(env) return env
def env(**kwargs): env = raw_env(**kwargs) env = wrappers.AssertOutOfBoundsWrapper(env) env = wrappers.NanNoOpWrapper(env, 0, "setting action to 0") env = wrappers.OrderEnforcingWrapper(env) return env