from datetime import datetime
from time import sleep

# Environment, Agent, Child and save_figure are assumed to be defined
# elsewhere in the project.


class Simulation(object):
    def __init__(self, location, shape, plot):
        self.location = location
        self.shape = shape
        self.plot = plot
        self.env = Environment(self.shape)
        self.agent = Agent()
        self.child = Child(self.env.state)

    def run(self, duration):
        """Run the simulation for `duration` seconds; return (reward, cells cleaned)."""
        start = datetime.now()
        # The child dirties the environment before the agent is switched on.
        self.env.state = self.child.run()
        self.agent.on()
        if self.plot:
            save_figure(self.env.x, self.env.y, self.env.state,
                        [self.agent.position[0]], [self.agent.position[1]])
        while self.agent.active:
            # Sense the environment, then act on it.
            self.agent.precepts(self.env.state)
            self.env.state = self.agent.effectors(self.env.state)
            if self.plot:
                save_figure(self.env.x, self.env.y, self.env.state,
                            [self.agent.position[0]], [self.agent.position[1]])
            else:
                sleep(0.5)
            # Once the time budget is spent, send the agent home and let it
            # take one more sense/act step.
            if (datetime.now() - start).seconds >= duration:
                self.agent.gohome()
                self.agent.precepts(self.env.state)
                self.env.state = self.agent.effectors(self.env.state)
                if self.plot:
                    save_figure(self.env.x, self.env.y, self.env.state,
                                [self.agent.position[0]], [self.agent.position[1]])
                else:
                    sleep(0.5)
        rwd, clnd = self.agent.reward, self.agent.cleaned
        self.agent.reset()
        return rwd, clnd
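# A minimal usage sketch of the class above. The location, shape, and
# duration values here are illustrative assumptions, not values taken
# from the project.
if __name__ == "__main__":
    sim = Simulation(location="living_room", shape=(10, 10), plot=False)
    reward, cleaned = sim.run(duration=60)
    print("reward:", reward, "cells cleaned:", cleaned)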
import numpy as np
# SummaryWriter is assumed to come from torch.utils.tensorboard (or the
# compatible tensorboardX package).
from torch.utils.tensorboard import SummaryWriter

# Objects
agent1 = Agent()
agent2 = Agent()

# Initializations
writer = SummaryWriter(comment="-q-iteration")
iter_no = 0

# Q-learning algorithm
profits = np.zeros((ITER_BREAK + 2, NUM_EPISODES + 2))
for ep in range(NUM_EPISODES):
    print(ep)
    # 1: initialise Qs
    env.reset()
    agent1.reset()
    agent2.reset()
    iter_no = 0
    s_next = 0
    while True:
        iter_no += 1
        # Exploration schedule: eps approaches 1 as iterations accumulate.
        eps = 1 - np.exp(-BETA * iter_no)
        # 2: agents choose actions simultaneously.
        action1 = agent1.act(eps)
        action2 = agent2.act(eps)
        # Encode the joint action as a single index in base nA.
        action = action1 * nA + action2
        # 3: outcomes are calculated.
        s = s_next
        s_next, reward_n, done, prob = env.step(action)
        # 4: Bellman updates.
        agent1.value_update(s, action1, reward_n[0], s_next)
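# For reference, a sketch of the one-step tabular Q-learning update that a
# call like agent1.value_update(s, action1, reward_n[0], s_next) typically
# performs. This is an illustrative assumption: the actual Agent class is
# not shown above, and alpha/gamma are hypothetical hyperparameters.
def q_learning_update(Q, s, a, r, s_next, alpha=0.1, gamma=0.95):
    # Q(s, a) <- Q(s, a) + alpha * (r + gamma * max_a' Q(s', a') - Q(s, a))
    Q[s, a] += alpha * (r + gamma * np.max(Q[s_next]) - Q[s, a])
    return Q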