Python Agent.get_noise Examples

Programming Language: Python

Namespace/Package Name: agent.agent

Class/Type: Agent

Method/Function: get_noise

Examples at hotexamples.com: 3

Python Agent.get_noise - 3 examples found. These are the top-rated real-world Python examples of agent.agent.Agent.get_noise extracted from open-source projects. You can rate examples to help us improve their quality.

Frequently Used Methods

Show Hide

Agent(30)

act(15)

inventory(4)

expReplay(4)

__init__(4)

execute(3)

get_noise(3)

get_action(2)

egreedy_action(2)

act_fcnet(2)

act_ffnet(2)

inventory1(2)

at_goal(2)

init_broker(2)

collect_transition_data(2)

cuda(2)

get_greedy_action(1)

get_judgements(1)

get_losses(1)

get_next_action(1)

_build(1)

get_step_value(1)

get_stochastic_action(1)

handler(1)

get_exploration_policy(1)

history(1)

init_or_update_local(1)

isExit(1)

has_finished_episode(1)

fitnetwork(1)

get_epsilon_policy(1)

competition(1)

action_process(1)

append(1)

append_sample(1)

buy_inventory(1)

calculate_margin(1)

choose_action(1)

connect(1)

get_commands(1)

display_state(1)

do_predicted_play(1)

eval(1)

REPORTING_PERIOD(1)

exp_replay(1)

act_covnet(1)

getTDError(1)

isLoggedIn(1)

Example #1

Show file

import gc
import gym
from agent.agent import Agent


MAX_EPISODES = 5


# Build the environment and read the first dimension of each space's shape.
env = gym.make('BipedalWalker-v2')
state_size, action_size = (
    env.observation_space.shape[0],
    env.action_space.shape[0],
)

agent = Agent(state_size, action_size)

# Warm-up: take 1024 noisy steps and pass every transition to agent.append.
state = env.reset()
for _ in range(1024):
    action = agent(state) + agent.get_noise()
    next_state, reward, done, info = env.step(action)
    agent.append(state, action, reward, done, next_state)
    # Begin a fresh episode once the current one reports done.
    state = env.reset() if done else next_state


# Run MAX_EPISODES episodes, resetting the environment at the start of each.
for _ep in range(MAX_EPISODES):
    state = env.reset()
    # count is incremented once per pass through the inner loop.
    count = 0
    while True:
        count += 1
        # env.render()
        # The action is the agent's output for the current state plus its noise term.
        action = agent(state) + agent.get_noise()
        next_state, reward, done, info = env.step(action)
        # NOTE(review): the excerpt ends here; no loop exit or update of
        # `state` is visible - confirm against the full file.

Example #2

Show file

MAX_EPISODES = 1000

# Alternative environment: gym.make('BipedalWalker-v2')
env = gym.make("Pendulum-v0")

# Print the upper and lower bounds of the action space, then of the
# observation space.
for space in (env.action_space, env.observation_space):
    print(space.high)
    print(space.low)

state_size, action_size = (
    env.observation_space.shape[0],
    env.action_space.shape[0],
)
agent = Agent(state_size, action_size, ACCESS_SIZE)

# Warm-up: ACCESS_SIZE steps. The agent's output is doubled, noise is added,
# and the sum is clipped to [-2, 2] before being passed to env.step.
state = env.reset()
for _ in range(ACCESS_SIZE):
    action = np.clip(2 * agent(state) + agent.get_noise(), -2, 2)
    next_state, reward, done, info = env.step(action)
    agent.append(state, action, reward, done, next_state)
    # Begin a fresh episode once the current one reports done.
    state = env.reset() if done else next_state


def to_np(scale):
    """Return ``np.array`` applied to a one-element list holding *scale*."""
    wrapped = [scale]
    return np.array(wrapped)


# Call viz.line twice, each time with X and Y set to to_np(0), and store the
# returned values in viz_reward and viz_length.
# NOTE(review): `viz` is not defined in this excerpt - presumably a visdom
# client; confirm against the full file.
viz_reward = viz.line(X=to_np(0), Y=to_np(0))
# Pause for one second between the two calls (reason not visible here - TODO confirm).
time.sleep(1)
viz_length = viz.line(X=to_np(0), Y=to_np(0))

Example #3

Show file

File: train_viz_BipedalWalker.py Project: zzwlstarby/DeepLearningNotes

MAX_EPISODES = 1000

env = gym.make('BipedalWalker-v2')

# Print the upper and lower bounds of the action space, then of the
# observation space.
for space in (env.action_space, env.observation_space):
    print(space.high)
    print(space.low)

state_size, action_size = (
    env.observation_space.shape[0],
    env.action_space.shape[0],
)
agent = Agent(state_size, action_size, ACCESS_SIZE)
agent.restore_models(1000)

# Warm-up: ACCESS_SIZE steps. Noise is added to the agent's output and the
# sum is clipped to [-1, 1] before being passed to env.step.
state = env.reset()
for _ in range(ACCESS_SIZE):
    action = np.clip(agent(state) + agent.get_noise(), -1, 1)
    next_state, reward, done, info = env.step(action)
    agent.append(state, action, reward, done, next_state)
    # Begin a fresh episode once the current one reports done.
    state = env.reset() if done else next_state


def to_np(scale):
    """Return ``np.array`` applied to a one-element list holding *scale*."""
    wrapped = [scale]
    return np.array(wrapped)


# Call viz.line twice, each time with X and Y set to to_np(0), and store the
# returned values in viz_reward and viz_length.
# NOTE(review): `viz` is not defined in this excerpt - presumably a visdom
# client; confirm against the full file.
viz_reward = viz.line(X=to_np(0), Y=to_np(0))
# Pause for one second between the two calls (reason not visible here - TODO confirm).
time.sleep(1)
viz_length = viz.line(X=to_np(0), Y=to_np(0))