コード例 #1
0
def main():
    """Run a saved deepq policy on Breakout indefinitely, printing episode rewards.

    The environment comes from ``make_atari("BreakoutNoFrameskip-v0")`` wrapped
    in ``WarpFrame`` and then ``FrameStack`` with ``k=4``.  The policy is loaded
    from ``breakout_model.pkl``.  Every step is rendered, and the outer loop
    never terminates on its own.
    """
    env = make_atari("BreakoutNoFrameskip-v0")
    env = WarpFrame(env)
    env = FrameStack(env, k=4)

    act = deepq.load("breakout_model.pkl")

    while True:
        obs = env.reset()
        done = False
        episode_rew = 0
        while not done:
            env.render()
            # obs[None] indexes with None (presumably adding a leading batch
            # axis -- confirm); the first element of the result is the action.
            action = act(obs[None])[0]
            obs, rew, done, _ = env.step(action)
            episode_rew += rew
        print("Episode reward", episode_rew)
コード例 #2
0
# Level name used both in the movie file name and as the retro state
# (alternative seen here: 'StarLightZone.Act3').
level_string = 'MarbleZone.Act1'
movie_path = (
    'retro-movies/human/SonicTheHedgehog-Genesis/contest/'
    'SonicTheHedgehog-Genesis-{}-0000.bk2'
).format(level_string)
movie = retro.Movie(movie_path)
# Step the movie once before its game and state are queried below.
movie.step()

# Scenario name handed to retro.make (alternative seen here: 'trajectory_max').
scenario_string = 'test_retro'
env = retro.make(
    game=movie.get_game(),
    state=level_string,
    scenario=scenario_string,
    use_restricted_actions=retro.ACTIONS_ALL,
)
env = WarpFrame(env)

# NOTE(review): at this point env is the WarpFrame wrapper; confirm that this
# assignment actually reaches the underlying retro environment.
env.initial_state = movie.get_state()
_obs = env.reset()
# Four references to the first observation and three zero rewards.
obs_list = [_obs] * 4
reward_list = [0.] * 3

# Turns action keys from the movie into the action number from sonic utils.
# Dictionary for these action keys:
# [['LEFT'], ['RIGHT'], ['LEFT', 'DOWN'], ['RIGHT', 'DOWN'], ['RIGHT', 'B'], ['DOWN'], ['NOOP'], ['B']]
NOOP_constant = 6


def sonic_define_action_dict():
    temp_dict = {}
    temp_dict['B'] = 7
    temp_dict['NOOP'] = 6
    temp_dict['DOWN'] = 5
    temp_dict['RIGHT', 'DOWN'] = 4
    temp_dict['LEFT', 'DOWN'] = 3