Python Agent.input_vector 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: agents

클래스/타입: Agent

메소드/함수: input_vector

hotexamples.com에서의 예제들: 1

Python Agent.input_vector - 1개의 예제가 발견되었습니다. 오픈소스 프로젝트에서 추출한 Python agents.Agent.input_vector의 실제 사용 예제 중 평가가 가장 높은 것입니다. 예제를 평가해 주시면 예제 품질을 높이는 데 도움이 됩니다.

자주 사용되는 메소드들

보기 숨기기

Agent(30)

run_episode(4)

act(4)

__init__(3)

name(3)

get_move(3)

eval(3)

mark(2)

move(2)

get_action(2)

from_conf(2)

reset(2)

learn(2)

test(2)

build_trajectories(2)

ships(1)

log_activity_active(1)

log_activity_idle(1)

update_t_pref(1)

update_belief(1)

train_model(1)

train(1)

on(1)

parameters(1)

ppo_update(1)

precepts(1)

symbol(1)

set_train_mode(1)

stop(1)

preference_position(1)

step(1)

program(1)

state(1)

load_curve_certificate(1)

start(1)

sample_duration_current_state(1)

save(1)

set_current_activity_end(1)

reset_graph_info(1)

input_vector(1)

load(1)

choose_state(1)

ac_model(1)

add_actuator(1)

add_event(1)

add_id(1)

add_sensor(1)

append_sample(1)

bombs_left(1)

예제 #1

파일 보기

파일: evaluation.py 프로젝트: temminks/Thesis

class Evaluator(J30Runner):
    """Evaluate stored model weights on the runner's projects.

    The runner is initialised with ``train=False``. ``self.projects`` is not
    set in this class; it is presumably provided by ``J30Runner`` -- confirm
    against the base class.
    """

    def __init__(self, model_name, model):
        """Set up the evaluator.

        :param model_name: name used to build the weight-file paths and the
            result-file names.
        :param model: wrapper object whose ``model`` attribute is the network
            used for ``load_weights`` and ``predict``; the wrapper itself is
            handed to the ``Agent``.
        """
        super().__init__(train=False)

        self.model_name = model_name
        self.model = model.model
        self.agent = Agent(self.projects, model)
        # One entry per evaluated model, appended by ``evaluate_all``.
        self.result = []

    def load_weights(self, number):
        """Load the weights of checkpoint ``number`` into ``self.model``.

        The file is expected at
        ``./models/<model_name>/<model_name>-<number>.h5``.

        :param number: index of the checkpoint to load.
        """
        # Local import keeps this block self-contained; the file's import
        # section is not visible here.
        import os

        # The path used to be built with hard-coded backslashes, which only
        # works on Windows. Joining with ``os.sep`` yields the identical
        # string on Windows and a valid path elsewhere.
        file_name = self.model_name + '-' + str(number) + '.h5'
        weights_path = os.sep.join(
            ['.', 'models', self.model_name, file_name])
        self.model.load_weights(weights_path)

    def evaluate_project(self, project) -> float:
        """Run ``project`` until it is finished and return the summed time.

        :param project: object offering ``is_finished()``, ``next(...)``,
            ``state()`` and ``get_actions()``.
        :return: the sum of the values returned by ``project.next``.
        """
        t = 0

        while not project.is_finished():
            # ``act`` returns ``(action, durations)``; both are forwarded.
            t += project.next(*self.act(project))

        return t

    def evaluate(self, num_of_iterations=100):
        """Evaluate every project in ``self.projects`` repeatedly.

        For each project, ``num_of_iterations`` fresh ``Project`` instances
        are created from the same path and ``stochastic`` flag, and each one
        is run with ``evaluate_project``.

        :param num_of_iterations: number of runs per project.
        :return: dict mapping the last eight characters of each project's
            path to a float array holding the result of every run.
        """
        durations = {}

        for project in self.projects:
            project_list = np.array([
                Project(project.path, stochastic=project.stochastic)
                for _ in range(num_of_iterations)
            ])
            durations[project.path[-8:]] = np.vectorize(
                self.evaluate_project, otypes=[float])(project_list)

        return durations

    def evaluate_all(self, num_of_models, num_of_iterations=100):
        """Evaluate the checkpoints ``0 .. num_of_models - 1`` in order.

        After each checkpoint the complete ``self.result`` list gathered so
        far is pickled to ``<model_name>-result-<index>`` in the current
        working directory.

        :param num_of_models: number of consecutive checkpoints to evaluate.
        :param num_of_iterations: number of runs per project and checkpoint.
        """
        for num_of_model in range(num_of_models):
            print('evaluating model', num_of_model)
            self.load_weights(num_of_model)
            self.result.append(self.evaluate(num_of_iterations))

            result_path = self.model_name + '-result-' + str(num_of_model)
            # The context manager closes (and flushes) the file even if
            # pickling fails; the bare ``open`` call used before leaked the
            # handle.
            with open(result_path, 'wb') as result_file:
                pickle.dump(self.result, result_file)

    def act(self, project):
        """The action with the highest value is executed.

        This function is different from the act-function during training: If no
        tasks are running, the model cannot choose the wait/void action. This
        prevents infinite loops if the wait/void action for such a state has the
        highest q-value.

        If at most one action is available, the empty (wait/void) action is
        returned without consulting the model.

        :return: the best action and the durations of the tasks in the action
        """
        state, durations = project.state()
        actions = project.get_actions()

        if len(actions) > 1:
            return self.get_best_action(state, actions, project), durations
        return [], durations

    def get_best_action(self, state, actions, project):
        """Return the action with the highest predicted value.

        :param state: state as returned by ``project.state()``.
        :param actions: candidate actions; ``act`` only calls this with more
            than one candidate.
        :param project: project whose ``running`` collection decides whether
            the wait/void action is allowed.
        :return: the selected element of ``actions``.
        """
        inputs = np.squeeze(
            np.array([
                self.agent.input_vector(state, action) for action in actions
            ]))
        # The second positional argument is presumably the batch size, so all
        # candidates are scored in one batch -- confirm against the model API.
        action_values = np.squeeze(self.model.predict(inputs, len(inputs)))
        max_val = np.argmax(action_values)
        # the wait/void action must not be the best action if there are no
        # running tasks
        # NOTE(review): the fallback skips index 0 only, i.e. it assumes the
        # wait/void action is the first entry of ``actions`` -- confirm
        # against ``Project.get_actions``.
        if len(project.running) == 0 and actions[max_val] == []:
            max_val = np.argmax(action_values[1:]) + 1
        return actions[max_val]