def __init__(self, name):
    """Build the MinAtar environment for ``name`` and cache its dimensions.

    Args:
        name: Game identifier forwarded to ``minatar.Environment``.
    """
    game = minatar.Environment(name)
    self.env = game

    # Flattened observation length. The 10 * 10 factor is hard-coded;
    # assumes a 10 x 10 spatial grid -- TODO confirm against state_shape().
    self.obs_dim = 10 * 10 * game.n_channels
    # The third entry of the reported state shape is stored as the
    # channel count.
    self.in_channels = game.state_shape()[2]

    # The action count is exposed under two attribute names; each one is
    # filled from its own num_actions() call.
    self.action_dim = game.num_actions()
    self.num_actions = game.num_actions()

    self.name = game.game_name()
def __init__(self, game_name):
    """Create the MinAtar environment for ``game_name``.

    Args:
        game_name: Game identifier passed to ``minatar.Environment`` as
            ``env_name``.
    """
    backend = minatar.Environment(env_name=game_name)
    self.env = backend
    # Store the action count on the environment object itself as ``n``.
    backend.n = backend.num_actions()
    # No episode has finished yet.
    self.game_over = False
# Environment-related command-line options: (flag, value type, default).
for _flag, _kind, _default in (
    ('--env-name', str, 'asterix'),
    ('--env-training-seed', int, 0),
    ('--env-evaluation-seed', int, 1),
    ('--seed', int, 100),
):
    parser.add_argument(_flag, type=_kind, default=_default)
# ------------------------------------------------------------------------------------------------------------------
# Parsed options as a plain dict keyed by option name.
config = vars(parser.parse_args())

# Build one environment for training and one for evaluation; they differ
# only in the seed they receive.
# NOTE(review): any env_type other than 0 or 1 leaves both environments as
# None and still hands them to Executor -- confirm that this is intended.
env = eval_env = None
env_type = config['env_type']
if env_type == 0:
    # 0: LavaWorld
    env = lavaworld.environment.Environment(
        seed=config['env_training_seed'])
    eval_env = lavaworld.environment.Environment(
        seed=config['env_evaluation_seed'])
elif env_type == 1:
    # 1: MinAtar -- both instances share every option except the seed.
    minatar_options = dict(
        sticky_action_prob=0.0,
        difficulty_ramping=False,
        time_limit=2000,
    )
    env = minatar.Environment(
        config['env_name'],
        random_seed=config['env_training_seed'],
        **minatar_options)
    eval_env = minatar.Environment(
        config['env_name'],
        random_seed=config['env_evaluation_seed'],
        **minatar_options)

executor = Executor(config, env, eval_env)
executor.run()