def main():
    """Replay a saved DQN policy on Breakout, printing each episode's reward.

    Builds the ``BreakoutNoFrameskip-v0`` environment wrapped with
    ``WarpFrame`` and a 4-frame ``FrameStack``, loads the policy stored in
    ``breakout_model.pkl`` through ``deepq.load``, and then plays episodes
    back to back, rendering every step.

    The outer loop has no exit condition, so this function never returns
    on its own; stop it by interrupting the process.
    """
    # Wrapper order is significant: frames are warped first, then stacked.
    env = FrameStack(WarpFrame(make_atari("BreakoutNoFrameskip-v0")), k=4)
    act = deepq.load("breakout_model.pkl")

    while True:
        observation = env.reset()
        finished = False
        total_reward = 0

        while not finished:
            env.render()
            # obs[None] presumably prepends a batch axis for the policy, and
            # element 0 of the result is the action for that single
            # observation -- TODO confirm against deepq's act signature.
            action = act(observation[None])[0]
            observation, reward, finished, _ = env.step(action)
            total_reward += reward

        print("Episode reward", total_reward)
level_string = 'MarbleZone.Act1' #'StarLightZone.Act3' movie_path = 'retro-movies/human/SonicTheHedgehog-Genesis/contest/SonicTheHedgehog-Genesis-{}-0000.bk2'.format( level_string) movie = retro.Movie(movie_path) movie.step() scenario_string = 'test_retro' #'test_retro' #'trajectory_max' env = retro.make(game=movie.get_game(), state=level_string, scenario=scenario_string, use_restricted_actions=retro.ACTIONS_ALL) env = WarpFrame(env) env.initial_state = movie.get_state() _obs = env.reset() obs_list = [_obs, _obs, _obs, _obs] reward_list = [0., 0., 0.] #turns action keys from movie into action number from sonic utils #dictionary for these action keys:[['LEFT'], ['RIGHT'], ['LEFT', 'DOWN'], ['RIGHT', 'DOWN'], ['RIGHT', 'B'], ['DOWN'], ['NOOP'], ['B']] NOOP_constant = 6 def sonic_define_action_dict(): temp_dict = {} temp_dict['B'] = 7 temp_dict['NOOP'] = 6 temp_dict['DOWN'] = 5 temp_dict['RIGHT', 'DOWN'] = 4 temp_dict['LEFT', 'DOWN'] = 3