Python Agent.get_noiseの例

プログラミング言語: Python

名前空間/パッケージ名: agent.agent

クラス/型: Agent

メソッド/関数: get_noise

hotexamples.comのコード掲載数: 3

Python Agent.get_noise - 3件のコード例が見つかりました。すべてオープンソースプロジェクトから抽出されたPythonのagent.agent.Agent.get_noiseの実例で、最も評価が高いものを厳選しています。コード例の評価を行っていただくことで、より質の高いコード例が表示されるようになります。

よく使われるメソッド

表示 / 非表示

Agent(30)

act(15)

inventory(4)

expReplay(4)

__init__(4)

execute(3)

get_noise(3)

get_action(2)

egreedy_action(2)

act_fcnet(2)

act_ffnet(2)

inventory1(2)

at_goal(2)

init_broker(2)

collect_transition_data(2)

cuda(2)

get_greedy_action(1)

get_judgements(1)

get_losses(1)

get_next_action(1)

_build(1)

get_step_value(1)

get_stochastic_action(1)

handler(1)

get_exploration_policy(1)

history(1)

init_or_update_local(1)

isExit(1)

has_finished_episode(1)

fitnetwork(1)

get_epsilon_policy(1)

competition(1)

action_process(1)

append(1)

append_sample(1)

buy_inventory(1)

calculate_margin(1)

choose_action(1)

connect(1)

get_commands(1)

display_state(1)

do_predicted_play(1)

eval(1)

REPORTING_PERIOD(1)

exp_replay(1)

act_covnet(1)

getTDError(1)

isLoggedIn(1)

コード例 #1

ファイルを表示

import gc
import gym
from agent.agent import Agent


MAX_EPISODES = 5
# Number of environment steps taken before the episode loop starts.
WARMUP_STEPS = 1024


env = gym.make('BipedalWalker-v2')
# Sizes are read from the first dimension of the observation/action space shapes.
state_size = env.observation_space.shape[0]
action_size = env.action_space.shape[0]

agent = Agent(state_size, action_size)

# Warm-up phase: step the environment with the agent's output plus its noise
# term and pass every transition to agent.append().
state = env.reset()
for _ in range(WARMUP_STEPS):
    action = agent(state) + agent.get_noise()
    next_state, reward, done, info = env.step(action)
    agent.append(state, action, reward, done, next_state)
    # Continue from the new state, or start a fresh episode if this one ended.
    state = env.reset() if done else next_state


# Run MAX_EPISODES episodes, resetting the environment at the start of each.
# NOTE(review): this excerpt ends mid-loop; the exit condition of the
# `while True` loop and any later use of `count` are not visible here.
for _ep in range(MAX_EPISODES):
    state = env.reset()
    count = 0  # incremented once per pass through the inner loop
    while True:
        count += 1
        # env.render()
        # Action is the agent's output for the current state plus its noise term.
        action = agent(state) + agent.get_noise()
        next_state, reward, done, info = env.step(action)

コード例 #2

ファイルを表示

MAX_EPISODES = 1000

# Alternative environment: gym.make('BipedalWalker-v2')
env = gym.make("Pendulum-v0")

# Print the bounds of the action and observation spaces, one per line.
print(
    env.action_space.high,
    env.action_space.low,
    env.observation_space.high,
    env.observation_space.low,
    sep="\n",
)

# Sizes are read from the first dimension of each space's shape.
state_size = env.observation_space.shape[0]
action_size = env.action_space.shape[0]
# ACCESS_SIZE is defined outside this excerpt.
agent = Agent(state_size, action_size, ACCESS_SIZE)

# Take ACCESS_SIZE steps, passing every transition to agent.append().
state = env.reset()
for _ in range(ACCESS_SIZE):
    # Doubled agent output plus noise, limited to the interval [-2, 2].
    action = np.clip(2 * agent(state) + agent.get_noise(), -2, 2)
    next_state, reward, done, info = env.step(action)
    agent.append(state, action, reward, done, next_state)
    # Continue from the new state, or start a fresh episode if this one ended.
    state = env.reset() if done else next_state


def to_np(scale):
    """Return a NumPy array built from a one-element list holding ``scale``.

    For a scalar argument the result has shape ``(1,)``.
    """
    wrapped = [scale]
    return np.array(wrapped)


# Create two line plots via `viz.line`, each given the single point (0, 0);
# the results are stored in `viz_reward` and `viz_length`.
# NOTE(review): `viz` is defined outside this excerpt — presumably a visdom
# client; confirm.
viz_reward = viz.line(X=to_np(0), Y=to_np(0))
# NOTE(review): the reason for this one-second pause is not shown here —
# presumably it lets the first plot be created before the second; confirm.
time.sleep(1)
viz_length = viz.line(X=to_np(0), Y=to_np(0))

コード例 #3

ファイルを表示

ファイル: train_viz_BipedalWalker.py プロジェクト: zzwlstarby/DeepLearningNotes

MAX_EPISODES = 1000

env = gym.make('BipedalWalker-v2')

# Print the upper and lower bounds of the action space, then of the
# observation space.
for space in (env.action_space, env.observation_space):
    print(space.high)
    print(space.low)

# Sizes are read from the first dimension of each space's shape.
state_size = env.observation_space.shape[0]
action_size = env.action_space.shape[0]
# ACCESS_SIZE is defined outside this excerpt.
agent = Agent(state_size, action_size, ACCESS_SIZE)
# NOTE(review): the meaning of the argument 1000 is not visible here —
# presumably a checkpoint or step index; confirm against Agent.restore_models.
agent.restore_models(1000)

# Take ACCESS_SIZE steps, passing every transition to agent.append().
state = env.reset()
for _ in range(ACCESS_SIZE):
    # Agent output plus noise, limited to the interval [-1, 1].
    action = np.clip(agent(state) + agent.get_noise(), -1, 1)
    next_state, reward, done, info = env.step(action)
    agent.append(state, action, reward, done, next_state)
    # Continue from the new state, or start a fresh episode if this one ended.
    state = env.reset() if done else next_state


def to_np(scale):
    """Wrap ``scale`` in a single-item list and convert that list to a NumPy array.

    A scalar ``scale`` therefore yields an array of shape ``(1,)``.
    """
    single_item = [scale]
    return np.array(single_item)


# Create two line plots via `viz.line`, each given the single point (0, 0);
# the results are stored in `viz_reward` and `viz_length`.
# NOTE(review): `viz` is defined outside this excerpt — presumably a visdom
# client; confirm.
viz_reward = viz.line(X=to_np(0), Y=to_np(0))
# NOTE(review): the reason for this one-second pause is not shown here —
# presumably it lets the first plot be created before the second; confirm.
time.sleep(1)
viz_length = viz.line(X=to_np(0), Y=to_np(0))