def test_box_space(self): env = gym.make("CartPole-v0") d = gym_space_to_dict(env.observation_space) sp = gym_space_from_dict(d) obs_space = env.observation_space _assert_array_equal( self.assertAlmostEqual, sp.low.tolist(), obs_space.low.tolist(), 0.001 ) _assert_array_equal( self.assertAlmostEqual, sp.high.tolist(), obs_space.high.tolist(), 0.001 ) _assert_array_equal(self.assertEqual, sp._shape, obs_space._shape) self.assertEqual(sp.dtype, obs_space.dtype)
def test_flex_dict(self): space = FlexDict({}) space["box"] = gym.spaces.Box(low=-1, high=1, shape=(1, 200)) space["discrete"] = gym.spaces.Discrete(2) space["tuple"] = gym.spaces.Tuple( (gym.spaces.Box(low=-1, high=1, shape=(1, 200)), gym.spaces.Discrete(2)) ) d = gym_space_to_dict(space) sp = gym_space_from_dict(d) self.assertTrue(isinstance(sp["box"], gym.spaces.Box)) self.assertTrue(isinstance(sp["discrete"], gym.spaces.Discrete)) self.assertTrue(isinstance(sp["tuple"], gym.spaces.Tuple))
def test_tuple_space(self): env = gym.make("CartPole-v0") space = gym.spaces.Tuple( spaces=[env.observation_space, env.action_space]) d = gym_space_to_dict(space) sp = gym_space_from_dict(d) _assert_array_equal( self.assertAlmostEqual, sp.spaces[0].low.tolist(), space.spaces[0].low.tolist(), 0.001, ) _assert_array_equal( self.assertAlmostEqual, sp.spaces[0].high.tolist(), space.spaces[0].high.tolist(), 0.001, ) _assert_array_equal(self.assertEqual, sp.spaces[0]._shape, space.spaces[0]._shape) self.assertEqual(sp.dtype, space.dtype) self.assertEqual(sp.spaces[1].n, space.spaces[1].n)