# Assumed imports for these snippets (rllab-style): numpy as np,
# rllab.misc.special as special, and Step from rllab.envs.base.
def step(self, action):
    # Alternative locomotion-style step (disabled): forward reward from
    # torso velocity, minus control and contact costs, plus a survival bonus.
    # self.forward_dynamics(action)
    # comvel = self.get_body_comvel("torso")
    # forward_reward = self.goal_direction * comvel[0]
    # lb, ub = self.action_bounds
    # scaling = (ub - lb) * 0.5
    # ctrl_cost = 0.5 * 1e-2 * np.sum(np.square(action / scaling))
    # contact_cost = 0.5 * 1e-3 * np.sum(
    #     np.square(np.clip(self.model.data.cfrc_ext, -1, 1)))
    # survive_reward = 0.05
    # reward = forward_reward - ctrl_cost - contact_cost + survive_reward
    # state = self._state
    # notdone = np.isfinite(state).all() \
    #     and state[2] >= 0.2 and state[2] <= 1.0
    # done = not notdone
    # ob = self.get_current_obs()
    # return Step(ob, float(reward), done)

    # Alternative multi-armed-bandit step (disabled): Bernoulli reward
    # drawn from the selected arm's mean.
    # obs = self.get_current_obs()
    # selected_arm_mean = self.arm_means[action]
    # reward = float(np.random.random() < selected_arm_mean)
    # self.ts += 1
    # done = self.ts >= self.max_path_length
    # state = np.zeros(2)
    # state[0] = reward
    # state[1] = 1
    # return Step(state, reward, done)

    # Tabular MDP step: sample the next state from the transition
    # distribution Ps[state, action], and draw a Gaussian reward with
    # mean Rs[state, action] and precision tau.
    ps = self.Ps[self.state, action]
    next_state = special.weighted_sample(ps, np.arange(self.n_states))
    reward_mean = self.Rs[self.state, action]
    reward = reward_mean + np.random.normal() * 1 / np.sqrt(self.tau)
    self.ts += 1
    self.state = next_state
    done = self.ts >= self.max_path_length
    # Observation layout: one-hot of the new state, then the reward,
    # then the done flag.
    state = np.zeros(2 + self.n_states)
    state[self.state] = 1
    state[self.n_states] = reward
    state[self.n_states + 1] = done
    return Step(state, reward, done)
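# The step() above relies on special.weighted_sample to draw the next
# state. A minimal sketch of that helper, assuming it draws one item with
# probability proportional to its weight (the real rllab helper may use
# an inverse-CDF loop; this sketch uses numpy's categorical sampler):
import numpy as np

def weighted_sample_sketch(weights, items):
    weights = np.asarray(weights, dtype=float)
    probs = weights / weights.sum()              # normalize to a distribution
    idx = np.random.choice(len(probs), p=probs)  # categorical draw
    return list(items)[idx]

# Example: sampling a next state from one transition row, as in step().
ps = np.array([0.1, 0.7, 0.2])
next_state = weighted_sample_sketch(ps, np.arange(3))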
def get_action(self, observation):
    if self.state_include_action:
        if self.prev_action is None:
            prev_action = np.zeros((self.action_space.flat_dim,))
        else:
            prev_action = self.action_space.flatten(self.prev_action)
        all_input = np.concatenate([
            self.observation_space.flatten(observation),
            prev_action
        ])
    else:
        all_input = self.observation_space.flatten(observation)
        # Placeholder only; should not be used when actions are excluded.
        prev_action = np.nan
    # Single recurrent step: feed the input and previous hidden state,
    # then unbatch the resulting action probabilities and hidden state.
    probs, hidden_vec = [
        x[0] for x in self.f_step_prob([all_input], [self.prev_hidden])
    ]
    action = special.weighted_sample(probs, range(self.action_space.n))
    self.prev_action = action
    self.prev_hidden = hidden_vec
    agent_info = dict(prob=probs)
    if self.state_include_action:
        agent_info["prev_action"] = prev_action
    return action, agent_info
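# Standalone illustration (hypothetical helper, not part of the policy
# above) of the input layout get_action builds when state_include_action
# is True: the flattened observation concatenated with a one-hot encoding
# of the previous discrete action, which is all zeros on the first step.
import numpy as np

def build_recurrent_input(obs_flat, prev_action, n_actions):
    if prev_action is None:
        prev_one_hot = np.zeros(n_actions)             # first step of an episode
    else:
        prev_one_hot = np.eye(n_actions)[prev_action]  # one-hot flatten
    return np.concatenate([obs_flat, prev_one_hot])

obs = np.array([0.3, -1.2])
print(build_recurrent_input(obs, None, 3))  # [ 0.3 -1.2  0.   0.   0. ]
print(build_recurrent_input(obs, 2, 3))     # [ 0.3 -1.2  0.   0.   1. ]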
def weighted_sample(self, weights):
    return special.weighted_sample(weights, self._items_arr)
def weighted_sample(self, weights):
    # range() replaces the Python 2-only xrange() here.
    return special.weighted_sample(weights, range(self.n))
def weighted_sample(self, weights):
    return special.weighted_sample(weights, range(self.n))
def weighted_sample(self, weights):
    # Optional interactive breakpoint for debugging.
    if config.TF_NN_SETTRACE:
        ipdb.set_trace()
    return special.weighted_sample(weights, range(self.n))
def weighted_sample_normalized(self, weights):
    # Sample one index per component from its slice of the weight vector,
    # then shift and scale each index by the component's base value.
    return [
        (special.weighted_sample(weights[s:s + n], range(n)) - b) / b
        for s, n, b in zip(self._slice, self._comp_dim, self._comp_base)
    ]
def weighted_sample(self, weights):
    # Sample one raw index per component; the base values are unused here.
    return [
        special.weighted_sample(weights[s:s + n], range(n))
        for s, n, _ in zip(self._slice, self._comp_dim, self._comp_base)
    ]
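# Hypothetical usage of the product-space samplers above. Assume a space
# with component sizes (3, 2), so self._slice = (0, 3) and self._comp_dim
# = (3, 2): weights[0:3] parameterizes the first component and
# weights[3:5] the second, with one index drawn independently per
# component.
import numpy as np

comp_dim = (3, 2)
slices = (0, 3)
weights = np.array([0.2, 0.5, 0.3, 0.9, 0.1])

draws = [
    np.random.choice(n, p=weights[s:s + n] / weights[s:s + n].sum())
    for s, n in zip(slices, comp_dim)
]
print(draws)  # e.g. [1, 0]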