Exemplos de nn.Module.act em Python

Linguagem de programação: Python

Espaço de nomes / nome do pacote: torch

Classe / Tipo: nn.Module

Método / Função: act

Exemplos em hotexamples.com: 3

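nn.Module.act em Python - 3 exemplos encontrados. Estes são os exemplos do mundo real mais bem avaliados de torch.nn.Module.act em Python, extraídos de projetos de código aberto. Observação: `act` não faz parte da API padrão de torch.nn.Module; nos exemplos abaixo, ele é um método definido pelas subclasses de cada projeto. Você pode avaliar os exemplos para nos ajudar a melhorar a qualidade deles.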

Métodos Frequentes

Exibir Ocultar

__class__(6)

_get_name(4)

act(3)

_unwrapped_forward(2)

__getstate__(2)

_get_mapping(1)

_time_split_kwargs(1)

_original_get_state(1)

_modeling_hooks(1)

_make_tracing_inputs(1)

_load_from_state_dict(1)

_keep_memory(1)

CostType(1)

_flat_weights(1)

__batch_counter__(1)

_backpack_extend(1)

_auto_quant_module_hook_type(1)

_apply(1)

__mask__(1)

__flops_handle__(1)

__flops__(1)

__batch_counter_handle__(1)

_decoder(1)

Métodos Frequentes

__class__ (6)

_get_name (4)

act (3)

_unwrapped_forward (2)

__getstate__ (2)

_get_mapping (1)

_time_split_kwargs (1)

_original_get_state (1)

_modeling_hooks (1)

_make_tracing_inputs (1)

Métodos Frequentes

_load_from_state_dict (1)

_keep_memory (1)

CostType (1)

_flat_weights (1)

__batch_counter__ (1)

_backpack_extend (1)

_auto_quant_module_hook_type (1)

_apply (1)

__mask__ (1)

__flops_handle__ (1)

__flops__ (1)

__batch_counter_handle__ (1)

_decoder (1)

Métodos Frequentes

__flops__ (1)

__batch_counter_handle__ (1)

_decoder (1)

Exemplo n.º 1

0

Exibir arquivo

def perform_rollout(env: gym.Env, model: torch.nn.Module, gamma: float) -> Memory:
    """Play a single episode with ``model`` and return the recorded rollout.

    A fresh ``Memory(gamma, BATCH_SIZE)`` is created, the environment is
    reset, and the loop keeps stepping until ``env.step`` reports ``done``.
    Every step stores the action, its log-probabilities, the state value,
    the reward and the terminal flag in the memory.

    Args:
        env: Environment exposing ``reset()`` and a 4-tuple ``step(action)``.
        model: Module exposing ``act(obs)`` that returns
            ``(action, action_logprobs, state_value)``.
        gamma: Forwarded unchanged to the ``Memory`` constructor.

    Returns:
        The ``Memory`` instance filled with the episode's transitions.
    """
    # NOTE(review): block structure was reconstructed from a
    # whitespace-collapsed source; all memory updates are assumed to run
    # once per environment step -- confirm against the original file.
    rollout = Memory(gamma, BATCH_SIZE)
    raw_obs = env.reset()

    while True:
        # Add a leading dimension of size 1 before handing the observation
        # to the model.
        batched_obs = torch.FloatTensor(raw_obs).unsqueeze(0)
        action, action_logprobs, state_value = model.act(batched_obs)

        raw_obs, reward, finished, _ = env.step(int(action))

        rollout.update_actions(action)
        rollout.update_action_logprobs(action_logprobs)
        rollout.update_state_values(state_value)
        rollout.update_rewards(torch.tensor(reward))
        rollout.update_is_terminals(torch.tensor(finished, dtype=torch.uint8))

        if finished:
            break

    return rollout

Exemplo n.º 2

0

Exibir arquivo

def collect_batch(env: gym.Env, actor: torch.nn.Module, buffer: Memory, batch_size: int, device: torch.device):
    """Roll out episodes with ``actor`` until ``buffer`` holds ``batch_size`` items.

    Each episode starts with ``env.reset()``; every observation is converted
    to a ``float32`` tensor on ``device`` and registered via
    ``buffer.add_obs``. Each transition is recorded with
    ``buffer.add_timestep`` and the episode is closed with
    ``buffer.end_rollout()``.

    Args:
        env: Environment exposing ``reset()`` and a 4-tuple ``step(action)``.
        actor: Module exposing ``act(obs)`` that returns
            ``(action, action_logprobs)``.
        buffer: Storage supporting ``len()``, ``add_obs``, ``add_timestep``
            and ``end_rollout``.
        batch_size: Collection stops once ``len(buffer)`` reaches this value
            (checked between episodes only).
        device: Device on which observation tensors are created.
    """
    # NOTE(review): block structure was reconstructed from a
    # whitespace-collapsed source; ``end_rollout`` is assumed to run once per
    # episode, after the inner loop -- confirm against the original file.

    def to_tensor(raw):
        # Single place that fixes the dtype/device of observation tensors.
        return torch.tensor(raw, dtype=torch.float32, device=device)

    while len(buffer) < batch_size:
        current = to_tensor(env.reset())
        last_idx = buffer.add_obs(current)
        episode_over = False

        while not episode_over:
            # The actor receives the observation with an extra leading
            # dimension; the first element of its action is sent to the env.
            action, action_logprobs = actor.act(current.unsqueeze(0))
            action = action.cpu().numpy()[0]

            raw_obs, reward, episode_over, _ = env.step(action)
            current = to_tensor(raw_obs)

            new_idx = buffer.add_obs(current)
            buffer.add_timestep(last_idx, new_idx, action, action_logprobs, reward, episode_over)
            last_idx = new_idx

        buffer.end_rollout()

Exemplo n.º 3

0

Exibir arquivo

def act(
    flags,
    actor_index: int,
    free_queue: mp.SimpleQueue,
    full_queue: mp.SimpleQueue,
    model: torch.nn.Module,
    buffers: Buffers,
    initial_agent_state_buffers,
):
    """Actor worker loop: fill rollout buffers with environment/agent outputs.

    The worker creates its own environment, seeds it, and then repeatedly:
    takes a buffer index from ``free_queue``, writes the last outputs of the
    previous rollout at time step 0, unrolls ``flags.unroll_length`` further
    steps into time steps ``1..unroll_length``, and puts the index on
    ``full_queue``. Receiving ``None`` from ``free_queue`` ends the loop.

    Args:
        flags: Configuration object; passed to ``create_env`` and read for
            ``unroll_length``.
        actor_index: Index of this worker; mixed into the environment seed
            and used in log messages. Only worker 0 logs the timing summary.
        free_queue: Source of buffer indices that may be written to.
        full_queue: Destination for indices whose buffers have been filled.
        model: Module exposing ``initialize(env_output, batch_size=1)`` and
            ``act(env_output, agent_state)``.
        buffers: Mapping ``key -> sequence`` indexed as
            ``buffers[key][index][t, ...]``.
        initial_agent_state_buffers: Indexed as
            ``initial_agent_state_buffers[index][i][...]``; receives the
            ``"core_state"`` tensors at the start of every rollout.

    Raises:
        Exception: Any non-``KeyboardInterrupt`` exception is logged, its
            traceback printed, and then re-raised. ``KeyboardInterrupt`` is
            swallowed so the worker exits silently.
    """
    # NOTE(review): block structure was reconstructed from a
    # whitespace-collapsed source; the timing summary is assumed to be logged
    # once, after the rollout loop exits -- confirm against the original file.
    try:
        logging.info("Actor %i started.", actor_index)
        timings = prof.Timings()  # Keep track of how fast things are.

        gym_env = create_env(flags)
        # XOR with OS randomness so every worker gets a different seed.
        seed = actor_index ^ int.from_bytes(os.urandom(4), byteorder="little")
        gym_env.seed(seed)
        env = environment.Environment(gym_env)
        env_output = env.initial()
        agent_state = model.initialize(env_output, batch_size=1)
        # Inference only: do not record autograd history for the priming
        # call, matching the call inside the rollout loop below.
        with torch.no_grad():
            agent_output, unused_state = model.act(env_output, agent_state)

        while True:
            index = free_queue.get()
            if index is None:
                break

            # Write old rollout end.
            for key in env_output:
                buffers[key][index][0, ...] = env_output[key]
            for key in agent_output:
                buffers[key][index][0, ...] = agent_output[key]
            for i, tensor in enumerate(agent_state["core_state"]):
                initial_agent_state_buffers[index][i][...] = tensor

            # Do new rollout.
            for t in range(flags.unroll_length):
                timings.reset()

                with torch.no_grad():
                    agent_output, agent_state = model.act(env_output, agent_state)

                timings.time("model")

                env_output = env.step(agent_output["action"])

                timings.time("step")

                for key in env_output:
                    buffers[key][index][t + 1, ...] = env_output[key]
                for key in agent_output:
                    buffers[key][index][t + 1, ...] = agent_output[key]

                timings.time("write")
            full_queue.put(index)

        if actor_index == 0:
            logging.info("Actor %i: %s", actor_index, timings.summary())

    except KeyboardInterrupt:
        pass  # Return silently.
    except Exception:
        logging.error("Exception in worker process %i", actor_index)
        traceback.print_exc()
        print()
        # Bare raise re-raises the active exception with its traceback intact.
        raise