Example #1
import random

import numpy as np

from agents.agent import Agent
from environments.lqr import LQR
from models.simple import Simple
from policies.rand import RandomPolicy
from policies.normal import NormalPolicy
from utils.data import SARSDataset

random.seed(42)

environment = LQR(-1, 1)
# a uniform random baseline and a Gaussian policy network; the Gaussian one is used below
policy_model_random = RandomPolicy(-2, 2)
policy_model_normal = NormalPolicy([1, 9, 1], [1.])
policy_model = policy_model_normal
value_model = Simple()

# train policy and value models with a few REPS iterations
agent = Agent(environment, policy_model, value_model, verbose=True)
agent.run_reps(iterations=3)

# discretize state and action spaces on a uniform grid over [-2, 2]
state_space = np.arange(-2, 2.1, 0.1)
action_space = np.arange(-2, 2.1, 0.1)

# sweep all state-action pairs and record the resulting SARS transitions
observations = []
for state in state_space:
    for action in action_space:
        environment.state = state
        new_state, reward, _, _ = environment.step(action)
        observations.append({
            'prev_state': state,
            'action': action,
            'reward': reward,
            'new_state': new_state})
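
The SARSDataset import suggests these transitions are meant to feed a dataset for value-model fitting. A minimal sketch, assuming SARSDataset wraps a list of SARS dictionaries with the keys used above (the constructor signature is an assumption, not confirmed by this repository):

# assumption: SARSDataset accepts a list of SARS dicts like the ones built above
dataset = SARSDataset(observations)
print(len(dataset))  # one transition per grid point, assuming __len__ is implemented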
Example #2
import os
import sys

# make the repository root importable when running this script directly
sys.path.append(os.path.join(os.path.dirname(__file__), '..'))

from agents.agent import Agent
from environments.atari import AtariBreakout
from policies.rand import RandomPolicy
from policies.normal import NormalPolicy
from models.mlp import MLP

environment = AtariBreakout()
# a discrete random baseline is available as an alternative:
# policy_model = RandomPolicy(0, 3, is_discrete=True)
policy_model = NormalPolicy([128, 64, 1], 1.)  # 128-d input, presumably Atari RAM observations
value_model = MLP([128, 64, 1])

agent = Agent(environment, policy_model, value_model, verbose=True)
agent.run_reps(exp_render=True)  # exp_render presumably renders the exploration rollouts
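
A quick qualitative check after training is to roll the learned policy out for one episode. A minimal sketch, assuming AtariBreakout follows the gym-style reset/step API implied by Example #1 and that the policy exposes a hypothetical get_action method (the real action-selection call may differ):

# hypothetical rollout loop; adapt get_action to the actual policy API
state = environment.reset()
done, episode_return = False, 0.
while not done:
    action = policy_model.get_action(state)  # hypothetical method name
    state, reward, done, _ = environment.step(action)
    episode_return += reward
print('episode return:', episode_return)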
Example #3
import random

import numpy as np
import torch

from agents.agent import Agent
from environments.lqr import LQR
from models.mlp import MLP
from policies.normal import NormalPolicy

# seed everything before building the models so weight initialization is reproducible
random.seed(42)
np.random.seed(42)
torch.manual_seed(42)

environment = LQR(-1, 1)
# environment.seed(42)  # uncomment if the environment supports seeding
# deeper Gaussian policy with tanh activations and a fixed standard deviation of 4
policy_model = NormalPolicy([1, 20, 45, 1], [4.], activation=torch.tanh)
value_model = MLP([1, 20, 45, 1])

agent = Agent(environment, policy_model, value_model, verbose=True)
agent.run_reps(100,                # number of REPS iterations (cf. Example #1)
               exp_timesteps=1000, # presumably timesteps per exploration phase
               exp_episodes=10,    # presumably exploration episodes per iteration
               exp_render=False,
               val_epsilon=0.1,    # presumably the REPS KL bound for the value/dual update
               pol_lr=1e-2)        # policy learning rate
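
Once training finishes, the learned value function can be inspected over the LQR state range. A minimal sketch, assuming MLP is a torch.nn.Module mapping an (N, 1) state tensor to values (an assumption about this repository's API):

# evaluate the value model on a grid of states, without tracking gradients
states = torch.linspace(-1, 1, 41).unsqueeze(1)
with torch.no_grad():
    values = value_model(states)
print(values.squeeze())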