def alphabeta_dtm(sp, a, s, depth, alpha, beta):
    """Negamax alpha-beta search over a ground-truth DTM signal.

    Args:
        sp: previous state (the state in which action ``a`` was played).
        a: action that led from ``sp`` to ``s``.
        s: current state.
        depth: remaining search depth in plies.
        alpha: lower bound of the pruning window.
        beta: upper bound of the pruning window.

    Returns:
        ``(best_action, best_score)`` — ``best_action`` is ``None`` at the
        horizon or when no move raised ``alpha`` (fail-low).
    """
    # Horizon: score the action that produced this node from the mover's view.
    # NOTE(review): sign/scale conventions follow Environment's DTM encoding —
    # confirm against map_side_to_int / action_outcome before changing.
    if depth == 0:
        ep = Environment(sp)
        return None, -map_side_to_int(ep.get_turn()) * ep.action_outcome(a)

    env = Environment(s)
    pairs = env.get_as_pairs()

    # One ply left: score every child directly instead of recursing.
    if depth == 1:
        scores = [
            -0.5 * map_side_to_int(env.get_turn()) * env.action_outcome(act)
            for (act, _) in pairs
        ]
        top = max(scores)
        # Deterministic tie-break: first action attaining the maximum.
        return pairs[scores.index(top)][0], top

    # Interior node: negamax recursion with a negated, swapped window.
    chosen = None
    for (act, nxt) in pairs:
        val = -0.5 * alphabeta_dtm(s, act, nxt, depth - 1, -beta, -alpha)[1]
        if val >= beta:
            # Fail-hard cutoff: return the bound, not the raw score.
            return act, beta
        if val > alpha:
            alpha = val
            chosen = act
    return chosen, alpha
def alphabeta_outcome(sp, a, s, depth, alpha, beta):
    """Negamax alpha-beta search over a ground-truth game outcome.

    Args:
        sp: previous state (the state in which action ``a`` was played).
        a: action that led from ``sp`` to ``s``.
        s: current state.
        depth: remaining search depth in plies.
        alpha: lower bound of the pruning window.
        beta: upper bound of the pruning window.

    Returns:
        ``(best_action, best_score)`` — ``best_action`` is ``None`` at the
        horizon, at a terminal position, or when no move raised ``alpha``.
    """
    # Horizon reached: replay the last action and score the resulting outcome.
    if depth < 1:
        term = Environment(sp)
        term.perform_action(a)
        return None, map_side_to_int(term.get_turn()) * term.int_outcome()

    env = Environment(s)
    pairs = env.get_as_pairs()

    # Terminal position (no legal moves): score it exactly as at the horizon.
    if not pairs:
        term = Environment(sp)
        term.perform_action(a)
        return None, map_side_to_int(term.get_turn()) * term.int_outcome()

    # One ply left: score every child directly instead of recursing.
    if depth == 1:
        scores = [
            0.5 * map_side_to_int(env.get_turn()) * env.action_outcome(act)
            for (act, _) in pairs
        ]
        top = max(scores)
        # First index attaining the maximum — same tie-break as np.argmax.
        pick = scores.index(top)
        return pairs[pick][0], top

    # Interior node: negamax recursion with a negated, swapped window.
    chosen = None
    for (act, nxt) in pairs:
        val = -0.5 * alphabeta_outcome(s, act, nxt, depth - 1, -beta, -alpha)[1]
        if val >= beta:
            # Fail-hard cutoff: return the bound, not the raw score.
            return act, beta
        if val > alpha:
            alpha = val
            chosen = act
    return chosen, alpha