Python Env.start 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: reaver.envs.base

클래스/타입: Env

메소드/함수: start

hotexamples.com에서의 예제들: 3

Python Env.start - 예제 3개를 찾았습니다. 아래는 오픈소스 프로젝트에서 추출한 Python reaver.envs.base.Env.start의 실제 사용 예제 중 평가가 가장 높은 것들입니다. 예제를 평가해 주시면 예제 품질을 높이는 데 도움이 됩니다.

자주 사용되는 메소드들

보기 숨기기

stop(3)

start(3)

render(1)

자주 사용되는 메소드들

stop (3)

start (3)

render (1)

예제 #1

파일 보기

 def run(self, env: Env, n_steps=1000000):
     """Start the wrapped environment and delegate to ``self._run``.

     The environment returned by ``self.wrap_env(env)`` is started and then
     handed to ``self._run`` together with ``n_steps``.

     A ``KeyboardInterrupt`` raised inside ``self._run`` is caught here: the
     wrapped environment is stopped and the interrupt is not re-raised.
     When ``self._run`` returns normally, this method does not stop the
     environment.
     """
     wrapped_env = self.wrap_env(env)
     wrapped_env.start()
     try:
         self._run(wrapped_env, n_steps)
     except KeyboardInterrupt:
         # Manual interruption: shut the environment down and return quietly.
         wrapped_env.stop()

예제 #2

파일 보기

 def run(self, env: Env, expt, event_buffer=None, n_steps=1000000):
     """Start the wrapped environment and delegate to ``self._run``.

     The environment returned by ``self.wrap_env(env)`` is started and then
     passed to ``self._run`` along with ``expt``, ``event_buffer`` and
     ``n_steps``.

     A ``KeyboardInterrupt`` raised inside ``self._run`` is caught here: the
     wrapped environment is stopped, ``self.on_finish()`` is called, and the
     interrupt is not re-raised. On normal completion neither of those two
     calls is made by this method.
     """
     wrapped_env = self.wrap_env(env)
     wrapped_env.start()
     try:
         self._run(wrapped_env, expt, event_buffer, n_steps)
     except KeyboardInterrupt:
         # Manual interruption: release the environment, then run the
         # finish hook before returning.
         wrapped_env.stop()
         self.on_finish()

예제 #3

파일 보기

    def run(self, env: Env, n_steps=1000000):
        """Run on ``env`` directly or on its sub-environments, per ``self.args``.

        Single-environment path -- taken when ``self.args.test`` is truthy,
        ``env.id`` is not a key of ``SUB_ENV_DICT``, or ``self.args.HRL`` is
        falsy:

        * if ``self.args.HRL`` is falsy or not ``'separate'``, the wrapped
          env is run with ``self._run``;
        * otherwise (``'separate'``) it is run with ``self._run_subenvs``,
          passing ``SUB_ENV_DICT[env.id]`` as ``subenvs``.

        Sub-environment path -- otherwise. ``self.args.HRL`` must be one of
        ``'human'``, ``'systematic'``, ``'random'``, ``'sequential'`` or
        ``'separate'``. One ``SC2Env`` is created per entry of
        ``SUB_ENV_DICT[env.id]`` and run in turn with its own step budget and
        reward threshold:

        * step budget: an equal share ``n_steps // len(subenvs)`` by default;
          for ``'random'`` the range ``[0, n_steps]`` is split at
          ``len(subenvs) - 1`` randomly drawn cut points (fixed seed 1234);
        * threshold: ``None`` by default; for ``'human'``, ``'sequential'``
          and ``'separate'`` the values come from ``HRL_thredhold(env.id)``.

        In every path a ``KeyboardInterrupt`` raised while running stops the
        current environment and is not re-raised (in the sub-environment loop
        it also ends the loop), and ``self.on_finish()`` is called last.

        Args:
            env: Environment to run, or the parent whose ``id`` selects the
                sub-environments.
            n_steps: Total number of steps to run.
        """

        if self.args.test or (env.id
                              not in SUB_ENV_DICT) or (not self.args.HRL):
            # either testing or training without HRL at all
            # or the env selected does not have the subenvs
            if not self.args.HRL or self.args.HRL != 'separate':
                env = self.wrap_env(env)
                env.start()
                try:
                    self.on_start()
                    self._run(env, n_steps)
                except KeyboardInterrupt:
                    env.stop()

                self.on_finish()

            # testing with HRL and separate subenvs
            else:
                env = self.wrap_env(env)
                env.start()
                subenvs = SUB_ENV_DICT[env.id]
                print(
                    LOGGING_MSG_HEADER +
                    ": Ensure that you are testing models trained using the <HRL_separate> approach."
                )
                print(
                    LOGGING_MSG_HEADER +
                    ": Testing the {} with combined subpolicies trained seperately from subenvs-{}"
                    .format(env.id, subenvs))
                try:
                    self.on_start()
                    self._run_subenvs(env, n_steps, subenvs=subenvs)
                except KeyboardInterrupt:
                    env.stop()
                self.on_finish()

        else:

            assert self.args.HRL in [
                'human', 'systematic', 'random', 'sequential', 'separate'
            ]
            subenvs = SUB_ENV_DICT[env.id]
            print(LOGGING_MSG_HEADER + "： Subenvs are: ", subenvs)
            # Defaults: equal step share and no reward threshold per subenv.
            subenv_steps = [n_steps // len(subenvs) for _ in subenvs]
            thresholds = [None for _ in subenvs]

            if self.args.HRL in ['human', 'sequential', 'separate']:
                thresholds = HRL_thredhold(env.id)
                print(LOGGING_MSG_HEADER + "： Reward thresholds are: ",
                      thresholds)

            elif self.args.HRL == 'random':
                import numpy as np
                np.random.seed(1234)
                # Draw len(subenvs) - 1 distinct cut points once, then take
                # the gaps between consecutive boundaries as step budgets.
                # (Previously a second draw used an undefined name ``I``.)
                cut_points = sorted(
                    np.random.choice(n_steps, len(subenvs) - 1, replace=False))
                indices = [0] + cut_points + [n_steps]
                subenv_steps = np.ediff1d(indices)
            elif self.args.HRL == 'systematic':
                # subenv_steps already defined and initialized above
                pass

            for i, (subenv, subenv_step, threshold) in enumerate(
                    zip(subenvs, subenv_steps, thresholds)):
                # Note: from the second iteration on, ``env`` is the wrapped
                # env of the previous subenv, so ``render`` / ``max_ep_len``
                # are read from that object.
                env = SC2Env(subenv, env.render, max_ep_len=env.max_ep_len)
                print(
                    LOGGING_MSG_HEADER +
                    ": Creating and Running subenv : {} with maximum {} steps, and reward threshold is {}."
                    .format(env.id, subenv_step, threshold))
                env = self.wrap_env(env)
                env.start()
                try:
                    self.on_start()
                    if i != 0:
                        self.reset()
                    self._run(env, subenv_step, threshold, subenv_id=i)
                except KeyboardInterrupt:
                    env.stop()
                    break
            self.on_finish()
        """