def f_clw_instantiate_envs(self):
        """ Instantiates both the Training and the Test Gym Envs
        - They provide the same dynamical model and the same reward
        """
        temp = 'gym_quadcopter:quadcopter-v' + str(self.env_desc.get_env_id())
        # TODO FIXME: Some models cannot handle multiple envs.
        N = self.env_desc.get_n_envs()
        if N < 1: 
            raise RuntimeError(f"NumEnvs needs to be >= 1 but got NumEnvs={N}")
        logging.info(f"[SETUP] Creating {N} Training Environments - START")

        # Instantiating all the Envs and storing them into a private var 
        self.__envs_training = [f_fwgym_get_env(
            env_id=temp, used_states=self.used_states, instance_index=i,
            query_classes=self.query_classes, query_class=self.query_class,
            params=self.args.training_params
        ) for i in range(N)]

        # Passing references to the previously created envs. NOTE: `i` is bound
        # as a default argument; a bare `lambda: self.__envs_training[i]` would
        # late-bind `i` and make every entry return the last env.
        self.env = DummyVecEnv([lambda i=i: self.__envs_training[i] for i in range(N)])
        logging.info(f"[SETUP] Creating {N} Training Environments - DONE")
        logging.info(f"[SETUP] Creating 1 Test Environments - START")
        self.env_test = f_fwgym_get_env(
            env_id=temp, used_states=self.used_states, instance_index=0,
            query_classes=self.query_classes, query_class=self.query_class,
            params=self.args.testing_params
        )
        logging.info(f"[SETUP] Creating 1 Test Environments - DONE")
    def test_env_make(self):
        """ Tests that f_fwgym_get_env and GymEnvBase.make build equivalent Envs
        """
        instance_index = 0
        action = np.array([1.0, 2.0, 3.0])
        env_id = 'gym_quadcopter:quadcopter-v2'

        env1 = f_fwgym_get_env(
            env_id=env_id, used_states=['e_p', 'e_q', 'e_r'],
            instance_index=instance_index, query_class='something',
            query_classes={}, params=self.testing_params
        )
        env1.reset()
        self.assertEqual(env1.params, self.testing_params)

        quadcopter = Quadcopter(T=20, dt_commands=0.03, dt=0.01)
        env2 = GymEnvBase.make(
            env_id=env_id, instance_index=instance_index,
            params=self.testing_params, quadcopter=quadcopter,
            used_states=['e_p', 'e_q', 'e_r']
        )
        env2.reset()
        self.assertEqual(env2.params, self.testing_params)
        self.assertEqual(env1.env_id, env2.env_id)
        self.assertEqual(env1.instance_index, env2.instance_index)
        self.assertEqual(env1.continuous, env2.continuous)
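
# A minimal sketch (an assumption, not the project's actual code) of the contract
# the comparison above relies on: a factory in the spirit of f_fwgym_get_env
# resolves the 'package:env-id' string through the gym registry and wires the
# extra attributes onto the returned env. `_sketch_get_env` is hypothetical.
import gym

def _sketch_get_env(env_id, used_states, instance_index, query_classes, query_class, params):
    env = gym.make(env_id)           # 'gym_quadcopter:quadcopter-vN' imports the package, then builds the env
    env.env_id = env_id              # attribute wiring below is assumed from the assertions above
    env.used_states = used_states
    env.instance_index = instance_index
    env.query_classes = query_classes
    env.query_class = query_class
    env.params = params
    return env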
    def run_test(self):
        """ Runs the old tests or the new properties observer based ones
        """
        if self.args.eval_properties_observer['is_active']:
            return self.compute_traces()

        logging.info(f"Start test at {dt.now().strftime('%Y%m%d_%H%M')}")
        logging.info(f"Test Arguments\n{self._args2str(self.args)}")
        self.f_fwtfw_init()

        temp = 'gym_quadcopter:quadcopter-v' + str(self.args.env)

        self.env = f_fwgym_get_env(env_id=temp,
                                   used_states=self.args.used_states,
                                   instance_index=0,
                                   query_classes=self.args.query_classes,
                                   query_class=self.args.query_class,
                                   params=self.args.testing_params)
        logging.info(
            f"[eval_models.py] Instantiated env {temp} with continuous={self.args.continuous}"
        )
        checkpoints = self.range_checkpoints()
        rewards, s_rates = self.f_checkpoints_range_2_mean_performance(
            checkpoints=checkpoints)

        starting_min_reward = -10

        temp_x = [0] + [
            self.args.num_iterations_checkpoint * i for i in range(
                self.args.start_index, self.args.end_index, self.args.step)
        ]
        temp_y = [starting_min_reward] + list(rewards)
        f_iofsw_plot(
            x=temp_x,
            y=temp_y,
            x_ticks=np.array(temp_x),
            y_ticks=np.array(temp_y),
            title="Rewards",
            label_x="Training Timesteps",
            label_y="Average Rewards",
            filename=f"{self.args.plots_dir}/Timesteps_Rewards_{dt.now().strftime('%Y%m%d_%H%M%S')}.png",
        )

        # temp_x (the training-timesteps axis) is reused unchanged from the rewards plot
        temp_y = [0] + list(s_rates)
        f_iofsw_plot(
            x=temp_x,
            y=temp_y,
            x_ticks=np.array(temp_x),
            y_ticks=np.array(temp_y),
            title="Success Rate",
            label_x="Training Timesteps",
            label_y="Average Success Rate",
            filename=f"{self.args.plots_dir}/Timesteps_SuccessRate_{dt.now().strftime('%Y%m%d_%H%M%S')}.png",
        )
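
# A hypothetical stand-in for f_iofsw_plot (the signature is taken from the calls
# above; the matplotlib body is an assumption): saves a labelled x/y line plot.
def _sketch_iofsw_plot(x, y, x_ticks, y_ticks, title, label_x, label_y, filename):
    import matplotlib
    matplotlib.use('Agg')  # headless backend, safe on training machines
    import matplotlib.pyplot as plt
    fig, ax = plt.subplots()
    ax.plot(x, y, marker='o')
    ax.set_xticks(x_ticks)
    ax.set_yticks(y_ticks)
    ax.set_title(title)
    ax.set_xlabel(label_x)
    ax.set_ylabel(label_y)
    fig.savefig(filename)
    plt.close(fig)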
    def test_env_set_z_velocity_angles_reset_function(self):
        """ Tests that the z / velocity / angle Reset Functions can be set from the Training Config
        """
        env_desc = EnvDict(env_dict=self.args.env)
        tp_desc = TrainingParamsDict(tp_dict=self.args.training_params)
        self.assertEqual(env_desc.get_env_id(), self.training_config['env']['value'])
        self.assertEqual(self.args.model, self.training_config['model'])
        self.assertEqual(self.args.n_steps, self.training_config['n_steps'])
        self.assertEqual(self.args.training_params, self.training_config['training_params'])

        for i in range(3):
            env_id = f'gym_quadcopter:quadcopter-v{i}'
            env = f_fwgym_get_env(
                env_id=env_id, used_states=['e_p', 'e_q', 'e_r'],
                instance_index=0, query_class='something',
                query_classes={}, params=self.args.training_params
            )
            self.assertEqual(env.params, self.args.training_params)

            env.reset()

            # Each reset_policy entry carries a [min, max] params pair; after a
            # reset, the matching quadcopter attribute must lie in that range.
            # Maps reset_policy keys to quadcopter attribute names.
            checks = {
                'abs_z': 'z',
                'velocity_x': 'velocity_x',
                'velocity_y': 'velocity_y',
                'velocity_z': 'velocity_z',
                'abs_roll': 'abs_roll',
                'abs_pitch': 'abs_pitch',
                'abs_yaw': 'abs_yaw',
                'rate_roll': 'rate_roll',
                'rate_pitch': 'rate_pitch',
                'rate_yaw': 'rate_yaw',
            }
            reset_policy = self.args.training_params['quadcopter']['reset_policy']
            for key, attr in checks.items():
                val_min = float(reset_policy[key]['params'][0])
                val_max = float(reset_policy[key]['params'][1])
                self.assertTrue(
                    val_min <= getattr(env.quadcopter, attr) <= val_max,
                    msg=f"{key} outside its reset range [{val_min}, {val_max}]"
                )
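
# A minimal sketch of how a reset_policy entry could be sampled on reset,
# assuming (from the config shape used above) each entry carries a 'pdf' name
# and a [min, max] 'params' pair; `_sketch_sample_reset` is hypothetical.
import numpy as np

def _sketch_sample_reset(entry, rng=np.random):
    if entry['pdf'] == 'uniform':
        lo, hi = float(entry['params'][0]), float(entry['params'][1])
        return rng.uniform(lo, hi)
    if entry['pdf'] == 'none':
        return 0.0  # deterministic fallback, consistent with the tests below
    raise ValueError(f"Unsupported pdf '{entry['pdf']}'")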
    def test_env_altitude_controller_temporal_consistency(self):
        """ Tests that env.altitude_controller.compute_thrust() has no random component
        """
        for pol in self.reset_policy:
            self.training_config['training_params']['quadcopter']['reset_policy'][pol]['pdf'] = 'none'
        self.training_config['model']['name'] = 'ddpg'
        self.args = training_args_from_configs(base_config=self.base_config, config=self.training_config, debug_info=False)

        env_desc = EnvDict(env_dict=self.args.env)
        tp_desc = TrainingParamsDict(tp_dict=self.args.training_params)
        self.assertEqual(env_desc.get_env_id(), self.training_config['env']['value'])
        self.assertEqual(self.args.model, self.training_config['model'])
        self.assertEqual(self.args.n_steps, self.training_config['n_steps'])
        self.assertEqual(self.args.training_params, self.training_config['training_params'])

        supported_envs = [0]
        for i in supported_envs:
            env_id = f'gym_quadcopter:quadcopter-v{i}'
            print(f"Checking EnvID={env_id}")
            env = f_fwgym_get_env(
                env_id=env_id, used_states=['e_p', 'e_q', 'e_r'],
                instance_index=0, query_class='something',
                query_classes={}, params=self.args.training_params
            )
            self.assertEqual(env.params, self.args.training_params)

            self.assertEqual(env.altitude_controller.p, 3000)
            self.assertEqual(env.altitude_controller.i, 300)
            self.assertEqual(env.altitude_controller.d, 500)

            obs_trace = np.zeros(10)
            exp_trace = np.zeros(10)

            env.reset()
            env.set_target_z(1.0)
            self.assertEqual(env.quadcopter.z, 0.0)
            self.assertEqual(env.target_z, 1.0)

            self.assertEqual(env.altitude_controller.z_integral, 0.0)
            self.assertEqual(env.previous_z_error, 0.0)

            for k in range(obs_trace.shape[0]):
                self.assertEqual(env.quadcopter.z, 0.0)
                exp_trace[k] = env.altitude_controller.compute_thrust(target_z=env.target_z, current_z=env.quadcopter.z)

            env.reset()
            env.set_target_z(1.0)
            self.assertEqual(env.quadcopter.z, 0.0)
            self.assertEqual(env.target_z, 1.0)

            self.assertEqual(env.altitude_controller.z_integral, 0.0)
            self.assertEqual(env.previous_z_error, 0.0)

            for k in range(obs_trace.shape[0]):
                self.assertEqual(env.quadcopter.z, 0.0)
                obs_trace[k] = env.altitude_controller.compute_thrust(target_z=env.target_z, current_z=env.quadcopter.z)

            self.assertTrue(np.allclose(obs_trace, exp_trace, atol=1e-5), msg=f"Temporal Consistency Check: EnvID={env_id} ObsTrace={obs_trace}, ExpTrace={exp_trace}, Delta={obs_trace-exp_trace}")
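
# A minimal PID sketch of what compute_thrust could look like, inferred from the
# state inspected above (p/i/d gains, z_integral, previous_z_error); the real
# controller implementation is not shown here, so treat this as an assumption.
class _SketchAltitudeController:
    def __init__(self, p=3000.0, i=300.0, d=500.0, dt=0.01):
        self.p, self.i, self.d, self.dt = p, i, d, dt
        self.z_integral = 0.0
        self.previous_z_error = 0.0

    def compute_thrust(self, target_z, current_z):
        error = target_z - current_z
        self.z_integral += error * self.dt
        derivative = (error - self.previous_z_error) / self.dt
        self.previous_z_error = error
        # Fully deterministic: same state + same inputs => same thrust,
        # which is what the temporal-consistency test above asserts.
        return self.p * error + self.i * self.z_integral + self.d * derivative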
    def test_env_controller_temporal_consistency_on_altitude(self):
        """ Tests that, given the same initial conditions and target_z, the selected altitude controller leads to the same z after the same number of iterations

        WARNING
        - This test currently fails due to precision issues, so it has been disabled; it revealed an issue that needs deeper investigation, which is why it stays committed in the repo
        """
        for pol in self.reset_policy:
            self.training_config['training_params']['quadcopter']['reset_policy'][pol]['pdf'] = 'none'
        self.training_config['model']['name'] = 'ddpg'
        self.args = training_args_from_configs(base_config=self.base_config, config=self.training_config, debug_info=False)

        env_desc = EnvDict(env_dict=self.args.env)
        tp_desc = TrainingParamsDict(tp_dict=self.args.training_params)
        self.assertEqual(env_desc.get_env_id(), self.training_config['env']['value'])
        self.assertEqual(self.args.model, self.training_config['model'])
        self.assertEqual(self.args.n_steps, self.training_config['n_steps'])
        self.assertEqual(self.args.training_params, self.training_config['training_params'])

        for i in self.supported_envs:
            env_id = f'gym_quadcopter:quadcopter-v{i}'
            print(f"Checking EnvID={env_id}")
            env = f_fwgym_get_env(
                env_id=env_id, used_states=['e_p', 'e_q', 'e_r'],
                instance_index=0, query_class='something',
                query_classes={}, params=self.args.training_params
            )
            self.assertEqual(env.params, self.args.training_params)

            self.assertEqual(env.altitude_controller.p, 3000)
            self.assertEqual(env.altitude_controller.i, 300)
            self.assertEqual(env.altitude_controller.d, 500)

            obs_trace = np.zeros(10)
            exp_trace = np.zeros(10)

            env.reset()
            env.set_target_z(1.0)
            self.assertEqual(env.quadcopter.z, 0.0)
            self.assertEqual(env.target_z, 1.0)
            self.assertEqual(env.z_integral, 0.0)
            self.assertEqual(env.previous_z_error, 0.0)
            for k in range(obs_trace.shape[0]):
                env.step(action=np.zeros(3))
                exp_trace[k] = env.quadcopter.z

            env.reset()
            env.set_target_z(1.0)
            self.assertEqual(env.quadcopter.z, 0.0)
            self.assertEqual(env.target_z, 1.0)
            self.assertEqual(env.z_integral, 0.0)
            self.assertEqual(env.previous_z_error, 0.0)
            for k in range(obs_trace.shape[0]):
                env.step(action=np.zeros(3))
                obs_trace[k] = env.quadcopter.z

            self.assertTrue(np.allclose(obs_trace, exp_trace, atol=1e-5), msg=f"Temporal Consistency Check: EnvID={env_id} ObsTrace={obs_trace}, ExpTrace={exp_trace}, Delta={obs_trace-exp_trace}")
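
# Why the traces are compared with np.allclose(atol=1e-5) rather than exact
# equality: float accumulation is order-sensitive, the kind of precision issue
# the WARNING in the docstring above refers to (illustrative snippet only).
def _demo_float_order_sensitivity():
    a, b, c = 1e16, 1.0, -1e16
    assert (a + b) + c == 0.0  # 1e16 + 1.0 rounds back to 1e16, the 1.0 is lost
    assert (a + c) + b == 1.0  # cancelling the big terms first preserves the 1.0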
    def test_set_saturation(self):
        """ Tests the saturation of the motors
        """
        env_id = 'gym_quadcopter:quadcopter-v0'
        env = f_fwgym_get_env(
            env_id=env_id, instance_index=0,
            query_class='something', query_classes={},
            params=self.args.training_params, used_states=['e_p', 'e_q', 'e_r']
        )
        self.assertSequenceEqual(
            list(env.quadcopter.saturation),
            [self.args.training_params['quadcopter']['saturation_motor'] * 65535., 65535., 65535., 65535.]
        )
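
# A minimal sketch (assumption) of how the saturation vector asserted above would
# be applied: per-motor PWM commands clipped to [0, saturation_i].
import numpy as np

def _sketch_apply_saturation(pwm_commands, saturation):
    return np.clip(pwm_commands, 0.0, np.asarray(saturation))

# e.g. with saturation_motor = 0.9 the first motor caps at 0.9 * 65535 = 58981.5:
# _sketch_apply_saturation(np.array([70000., 70000., 1000., -5.]),
#                          [0.9 * 65535., 65535., 65535., 65535.])
# -> array([58981.5, 65535., 1000., 0.])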
    def test_env(self):
        """ Tests that the Env built from the Training Config exposes the expected params
        """
        env_desc = EnvDict(env_dict=self.args.env)
        tp_desc = TrainingParamsDict(tp_dict=self.args.training_params)
        self.assertEqual(env_desc.get_env_id(), self.training_config['env']['value'])
        self.assertEqual(self.args.model, self.training_config['model'])
        self.assertEqual(self.args.n_steps, self.training_config['n_steps'])
        self.assertEqual(self.args.training_params, self.training_config['training_params'])

        env_id = 'gym_quadcopter:quadcopter-v' + str(env_desc.get_env_id())
        env = f_fwgym_get_env(
            env_id=env_id, used_states=['e_p', 'e_q', 'e_r'],
            instance_index=0, query_class='something', query_classes={},
            params=self.args.training_params
        )
        self.assertEqual(env.params, self.args.training_params)
    def setUp(self):
        """ Prepares the test environment
        """
        with open('run/config/default.yaml', 'r') as f:
            self.base_config = yaml.safe_load(f)
        with open(self.base_config['filenames']['config_training'], 'r') as f:
            self.training_config = yaml.safe_load(f)['training']
        self.testing_params = self.training_config['training_params']
        self.is_continuous = (self.testing_params['query_generation']['value'] == "continuous")
        self.env_id = 'gym_quadcopter:quadcopter-v0'
        self.env = f_fwgym_get_env(
            env_id=self.env_id, used_states=['e_p', 'e_q', 'e_r'],
            instance_index=0, query_class='something',
            query_classes={}, params=self.testing_params
        )
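
# A sketch of the minimal config shape this setUp assumes, reconstructed from the
# keys accessed in these tests (the real YAML files may carry more entries; every
# concrete value below is a placeholder):
_SKETCH_TRAINING_CONFIG = {
    'training': {
        'env': {'value': 0},
        'model': {'name': 'ddpg'},
        'n_steps': 1000,
        'training_params': {
            'query_generation': {'value': 'continuous'},
            'quadcopter': {
                'saturation_motor': 1.0,
                'reset_policy': {
                    'abs_z': {'pdf': 'uniform', 'params': [0.0, 1.0]},
                    # ... velocity_x/y/z, abs_roll/pitch/yaw, rate_roll/pitch/yaw
                    # follow the same {'pdf': ..., 'params': [min, max]} shape
                },
            },
        },
    },
}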
    def compute_traces(self):
        """ For each Stable Baselines Checkpoint in the experiment dir, given a certain Query Generator Configuration, it computes traces

        All the Stable Baselines Checkpoints are loaded and run in an Env with a properly instantiated Query Generator
        """

        # Instantiate the Env for the Tests
        env_id = 'gym_quadcopter:quadcopter-v' + str(self.args.env)
        self.env = f_fwgym_get_env(env_id=env_id,
                                   used_states=self.args.used_states,
                                   instance_index=0,
                                   query_classes=self.args.query_classes,
                                   query_class=self.args.query_class,
                                   params=self.args.testing_params)

        # Register Callback
        self.env.quadcopter.cb_step = self.cb_quadcopter_step
        logging.info(
            f"[eval_models.py] Instantiated env {env_id} with continuous={self.args.continuous}"
        )
        checkpoints = self.range_checkpoints()

        # Iterate over the checkpoints
        for i in checkpoints:
            # Input: Checkpoints Dir
            cp_path = get_checkpoint_path(
                base_path=self.args.training_base_path,
                idx=i,
                suffix=self.args.suffix)
            # Loads the model from the Checkpoint
            model = load_model(path=cp_path,
                               env=self.env,
                               desc=self.args.model['name'])

            # Create a dir for the traces related to a given checkpoint, using `self.args.log_dir` as base
            base_path_cp_id = self.args.log_dir + f"/checkpoint_{i}/"
            Path(base_path_cp_id).mkdir()

            # Iterate over the episodes to test each checkpoint
            for j in range(self.args.n_episodes):

                # Get the evaluation results filenames
                query_full_path, commands_full_path, signals_full_path = get_signals_path(
                    basepath_checkpoint=base_path_cp_id, episode_idx=j)

                # Get the data structures for the evaluated data
                self.query, self.cmds, self.signals = get_signals_containers()

                # Reset the env at the beginning of each episode
                obs = self.env.reset()

                # Simulation loop
                while True:
                    # NOTE: The time granularity here has to be dt_commands, not dt, because this loop is in sync with the step() method
                    query_item = {
                        't': self.env.quadcopter.t.hex(),
                        'query_p': float(self.env.query[0]).hex(),
                        'query_q': float(self.env.query[1]).hex(),
                        'query_r': float(self.env.query[2]).hex()
                    }
                    # NOTE: DataFrame.append is deprecated in recent pandas;
                    # pd.concat([...]) is the modern equivalent
                    self.query = self.query.append(query_item,
                                                   ignore_index=True)

                    # Get the action from the Actor
                    action, _ = model.predict(obs, deterministic=True)
                    obs, reward, done, _ = self.env.step(action)

                    if done:
                        break

                self.query.to_csv(query_full_path, index=False)
                self.cmds.to_csv(commands_full_path, index=False)
                self.signals.to_csv(signals_full_path, index=False)
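
# The traces above store timestamps and query values as float hex strings
# (float.hex()), which round-trip exactly through CSV. A short sketch of reading
# a query trace back; `_sketch_load_query_trace` is hypothetical.
import pandas as pd

def _sketch_load_query_trace(query_csv_path):
    df = pd.read_csv(query_csv_path)
    # float.fromhex inverts float.hex with no precision loss
    for col in ('t', 'query_p', 'query_q', 'query_r'):
        df[col] = df[col].map(float.fromhex)
    return df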