import numpy as np

# ReplayBuffer, Net, and linear_interp are defined elsewhere in the project.


class Agent:
    def __init__(self, env, config, wt):
        self.C = config
        self.n_state = list(env.observation_space.shape)
        self.n_action = env.action_space.n
        self.epsilon = 0.99
        self.lr = 1e-3
        self.wt = wt
        self.buffer = ReplayBuffer(self.C['max_size'], self.C['frame_stack'])
        # Second replay buffer (not used in this listing).
        self.buffer2 = ReplayBuffer(self.C['max_size'], self.C['frame_stack'])
        self.net = Net(self.n_state, self.n_action, self.C, self.wt)

    # Random action during practice.
    def act_pre(self):
        return np.random.randint(self.n_action)

    # Epsilon-greedy action selection.
    def act(self, s):
        if np.random.random() > self.epsilon:
            return self.greedy_act(s)
        return np.random.randint(self.n_action)

    def greedy_act(self, s):
        return self.net.action(s)

    # Practice without recording experiences.
    def practice(self):
        self.lr = 1e-3  # learning rate for pre-training
        self.net.pre_train(self.buffer, self.lr)

    # Records experiences and calls the training functions.
    # `pre` differentiates practice from RL training.
    def record(self, s, a, r, d, it, pre):
        if pre:
            self.buffer.append(s, a, r, d)
            if it > self.C['pre_training_start']:
                if it % self.C['pre_train_freq'] == 0:
                    self.lr = 1e-3  # learning rate for pre-training
                    self.net.pre_train(self.buffer, self.lr)
        else:
            self.buffer.append(s, a, r, d)
            # Anneal epsilon from 1.0 to 0.1 over the first 5e5 steps,
            # then from 0.1 down to a floor of 0.01 by step 1e7.
            if it <= 5e5:
                self.epsilon = linear_interp(0, 5e5, it, 0.1, 1.0)
            else:
                self.epsilon = max(linear_interp(5e5, 10e6, it, 0.01, 0.1), 0.01)
            if it > self.C['training_start']:
                if it % self.C['train_freq'] == 0:
                    self.lr = 1e-4  # learning rate for RL training
                    self.net.train(self.buffer, self.lr)
                if it % self.C['update_target_freq'] == 0:
                    self.net.update_target_network()
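# The class above calls linear_interp, which is not shown in this listing.
# Below is a minimal sketch consistent with the call sites (epsilon decays
# from 1.0 at step 0 to 0.1 at step 5e5, then from 0.1 to 0.01 by step 1e7).
# The argument order is an assumption inferred from that usage, not the
# project's actual definition.
def linear_interp(x0, x1, x, y_lo, y_hi):
    # Anneal linearly from y_hi at x=x0 down to y_lo at x=x1.
    frac = (x - x0) / (x1 - x0)
    return y_hi + frac * (y_lo - y_hi)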
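# Hypothetical driver loop showing how the Agent methods fit together. The
# environment name, the config values, and the practice/training split are
# illustrative assumptions; only act_pre/act/record come from the class
# above. Assumes the classic gym API where step() returns
# (obs, reward, done, info).
import gym

env = gym.make('PongNoFrameskip-v4')
config = {'max_size': 100000, 'frame_stack': 4,
          'pre_training_start': 1000, 'pre_train_freq': 4,
          'training_start': 10000, 'train_freq': 4,
          'update_target_freq': 10000}
agent = Agent(env, config, wt=None)

s = env.reset()
for it in range(1, 1000001):
    pre = it <= config['training_start']           # practice phase first
    a = agent.act_pre() if pre else agent.act(s)   # random, then eps-greedy
    s2, r, d, _ = env.step(a)
    agent.record(s, a, r, d, it, pre)              # store and maybe train
    s = env.reset() if d else s2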