def setup_method(self):
    """Prepare the environment, scripted policy and mocked algorithm.

    Stores three attributes on the test instance: ``env``, ``policy`` and
    ``algo``. ``algo`` is a ``Mock`` that only carries the environment
    spec, the policy and the maximum episode length.
    """
    # One scripted action per step; the list holds 16 entries, the same
    # number as ``max_episode_length`` passed to the mock below.
    action_script = [2, 2, 1, 0, 3, 1, 1, 1, 2, 2, 1, 1, 1, 2, 2, 1]

    self.env = GridWorldEnv(desc='4x4')
    self.policy = ScriptedPolicy(scripted_actions=action_script)
    self.algo = Mock(
        env_spec=self.env.spec,
        policy=self.policy,
        max_episode_length=16,
    )
def other_envs():
    """Build one ``GridWorldEnv`` for each hard-coded map description.

    Returns:
        list: Five ``GridWorldEnv`` instances, in the same order as the
            map descriptions listed in the body.
    """
    # Every layout is a list of four row strings with four cells each.
    # NOTE(review): the cell letters presumably mean S=start, F=free,
    # H=hole, G=goal -- confirm against GridWorldEnv.
    layouts = [
        ['SFFF', 'FFFF', 'FFFF', 'FFFF'],
        ['FFSF', 'FFFH', 'FHFH', 'HFFG'],
        ['FHSF', 'FFFH', 'FHFH', 'HFFG'],
        ['FHSF', 'FGFH', 'FHFH', 'HFFH'],
        ['SHFF', 'HHFF', 'FFFF', 'FFFF'],
    ]

    worlds = []
    for layout in layouts:
        worlds.append(GridWorldEnv(desc=layout))
    return worlds
def envs():
    """Build ``GarageEnv``-wrapped grid worlds from hard-coded maps.

    Every map in this set has its ``'S'`` cell in the first column of the
    first row.

    Returns:
        list: Five ``GarageEnv`` instances, each wrapping a
            ``GridWorldEnv``, in the same order as the maps listed in the
            body.
    """
    # NOTE(review): the cell letters presumably mean S=start, F=free,
    # H=hole, G=goal -- confirm against GridWorldEnv.
    layouts = [
        ['SFFF', 'FHFH', 'FFFH', 'HFFG'],
        ['SFFF', 'FFFH', 'FHFH', 'HFFG'],
        ['SFFF', 'FFFH', 'FHFH', 'FFFG'],
        ['SFFF', 'FFFF', 'FFFF', 'FFFF'],
        ['SHFF', 'HHFF', 'FFFF', 'FFFF'],
    ]

    def _wrap(layout):
        # Create the raw grid world first, then wrap it.
        return GarageEnv(GridWorldEnv(desc=layout))

    return list(map(_wrap, layouts))
def other_envs():
    """Build a second set of ``GarageEnv``-wrapped grid worlds.

    None of the maps in this set has its ``'S'`` cell in the first column
    of the first row.

    Returns:
        list: Five ``GarageEnv`` instances, each wrapping a
            ``GridWorldEnv``, in the same order as the maps listed in the
            body.
    """
    # NOTE(review): the cell letters presumably mean S=start, F=free,
    # H=hole, G=goal -- confirm against GridWorldEnv.
    layouts = [
        ['FFFS', 'FHFH', 'FFFH', 'HFFG'],
        ['FFSF', 'FFFH', 'FHFH', 'HFFG'],
        ['FFFF', 'FFSH', 'FHFH', 'FFFG'],
        ['FFFF', 'FFFF', 'FSFF', 'FFFF'],
        ['HHFF', 'HHHF', 'HSHF', 'HHHF'],
    ]

    wrapped = []
    for layout in layouts:
        grid_world = GridWorldEnv(desc=layout)
        wrapped.append(GarageEnv(grid_world))
    return wrapped
def env():
    """Create a ``GridWorldEnv`` from the ``'4x4'`` map description.

    Returns:
        GridWorldEnv: A freshly constructed environment.
    """
    grid_world = GridWorldEnv(desc='4x4')
    return grid_world
def env():
    """Create a ``GarageEnv`` wrapping a ``'4x4'`` ``GridWorldEnv``.

    Returns:
        GarageEnv: A freshly constructed wrapper around a new grid world.
    """
    grid_world = GridWorldEnv(desc='4x4')
    wrapped = GarageEnv(grid_world)
    return wrapped