def run_submission(cfg, output, nr):
    """Play ``nr`` episodes and print the score of each one.

    Args:
        cfg: Configuration handed to ``get_predict_func`` to build the
            prediction function.
        output: Value passed to ``get_player`` as ``dumpdir``.
        nr: Number of episodes to play.
    """
    env_player = get_player(dumpdir=output)
    policy = get_predict_func(cfg)
    for episode_idx in range(nr):
        # Restart only between episodes; nothing is restarted before the
        # very first one.
        if episode_idx > 0:
            env_player.restart_episode()
        episode_score = play_one_episode(env_player, policy)
        print("Total:", episode_score)
def run_submission(cfg, output='gym-submit', nr=100):
    """Play ``nr`` episodes and print the score of each one.

    The dump directory and the episode count used to be hard-coded; they are
    now parameters whose defaults reproduce the previous behaviour, so
    existing ``run_submission(cfg)`` callers are unaffected.

    Args:
        cfg: Configuration handed to ``get_predict_func`` to build the
            prediction function.
        output: Value passed to ``get_player`` as ``dumpdir``.
        nr: Number of episodes to play.
    """
    player = get_player(dumpdir=output)
    predfunc = get_predict_func(cfg)
    for k in range(nr):
        # Restart only between episodes, never before the first one.
        if k != 0:
            player.restart_episode()
        score = play_one_episode(player, predfunc)
        print("Total:", score)
def run_submission(cfg, output, nr):
    """Evaluate an ``OfflinePredictor`` over ``nr`` episodes, printing each score.

    Args:
        cfg: Configuration used to construct the ``OfflinePredictor``.
        output: Value passed to ``get_player`` as ``dumpdir``.
        nr: Number of episodes to play.
    """
    env_player = get_player(dumpdir=output)
    predictor = OfflinePredictor(cfg)
    logger.info("Start evaluation: ")
    for episode_idx in range(nr):
        # Restart only between episodes; the first one runs on the player
        # as returned by get_player.
        if episode_idx > 0:
            env_player.restart_episode()
        episode_score = play_one_episode(env_player, predictor)
        print("Score:", episode_score)
def run_submission(cfg, output, nr):
    """Run ``nr`` evaluation episodes with an ``OfflinePredictor`` and print scores.

    Args:
        cfg: Configuration used to construct the ``OfflinePredictor``.
        output: Value passed to ``get_player`` as ``dumpdir``.
        nr: Number of episodes to play.
    """
    game = get_player(dumpdir=output)
    predict = OfflinePredictor(cfg)
    logger.info("Start evaluation: ")

    # False for the first episode, True afterwards: the player is restarted
    # between episodes but not before the first.
    restart_needed = False
    for _ in range(nr):
        if restart_needed:
            game.restart_episode()
        restart_needed = True
        result = play_one_episode(game, predict)
        print("Score:", result)
def run_submission(cfg, output, nr):
    """Play ``nr`` episodes, print each score, then finish the player.

    ``player.finish()`` is now called from a ``finally`` clause so it runs
    even when building the predictor or playing an episode raises.

    Args:
        cfg: Configuration handed to ``get_predict_func`` to build the
            prediction function.
        output: Value passed to ``get_player`` as ``dumpdir``.
        nr: Number of episodes to play.
    """
    player = get_player(dumpdir=output)
    try:
        predfunc = get_predict_func(cfg)
        for k in range(nr):
            # Restart only between episodes, never before the first one.
            if k != 0:
                player.restart_episode()
            score = play_one_episode(player, predfunc, verbose=False)
            print("Total:", score)
    finally:
        # NOTE(review): presumably finish() finalizes whatever the player
        # wrote to ``output`` -- confirm against the player implementation.
        player.finish()
def run_submission(cfg, dump_dir='gym-submit', nr=10):
    """Play ``nr`` episodes and print the score of each one.

    The episode count used to be hard-coded to 10; it is now the ``nr``
    parameter with the same default, so existing callers are unaffected.

    Args:
        cfg: Configuration handed to ``get_predict_func`` to build the
            prediction function.
        dump_dir: Value passed to ``get_player`` as ``dumpdir``.
        nr: Number of episodes to play.
    """
    player = get_player(dumpdir=dump_dir)
    predfunc = get_predict_func(cfg)
    for k in range(nr):
        # Restart only between episodes, never before the first one.
        if k != 0:
            player.restart_episode()
        score = play_one_episode(player, predfunc)
        print("Total:", score)
def run_submission(cfg, output, nr):
    """Play ``nr`` episodes, print each score, then close the gym monitor.

    The monitor is now closed from a ``finally`` clause so it is released
    even when building the predictor or playing an episode raises.

    Args:
        cfg: Configuration handed to ``get_predict_func`` to build the
            prediction function.
        output: Value passed to ``get_player`` as ``dumpdir``.
        nr: Number of episodes to play.
    """
    # get_player returns a pair here: the player that is driven through the
    # episodes and the object whose ``gymenv.monitor`` is closed at the end.
    player, playerenv = get_player(dumpdir=output)
    try:
        predfunc = get_predict_func(cfg)
        logger.info("Start evaluation: ")
        for k in range(nr):
            # Restart only between episodes, never before the first one.
            if k != 0:
                player.restart_episode()
            score = play_one_episode(player, predfunc)
            print("The {0:d}th episodes, Total:".format(k), score)
    finally:
        playerenv.gymenv.monitor.close()
def play(self, num_episodes, env, record=False, seed=None, tst=False):
    """Play ``num_episodes`` episodes and return the mean score.

    Args:
        num_episodes: Number of episodes to play.
        env: String prefixed to the per-episode score line that is printed.
        record: When true, ``self.save`` is passed to ``self.get_player`` as
            ``dumpdir``; otherwise ``None`` is passed.
        seed: Forwarded to ``self.get_player``; when not ``None`` it is also
            applied to the wrapped gym environment.
        tst: When true, the prediction function is rebuilt even if
            ``record`` is set.

    Returns:
        The arithmetic mean of the episode scores.

    Raises:
        ZeroDivisionError: If ``num_episodes`` yields no episodes, because
            the mean is taken over an empty list.
    """
    dump_dir = self.save if record else None
    self.player = self.get_player(dumpdir=dump_dir, seed=seed)

    # Build the predictor once. Previously the ``not record`` and ``tst``
    # branches each rebuilt it, so it was constructed twice when both held.
    # With ``record`` set and ``tst`` unset, an already assigned
    # ``self.predfunc`` is reused.
    if tst or not record:
        self.predfunc = get_predict_func(self.cfg)

    if seed is not None:
        print('set seed', seed)
        # The gym environment sits under three ``player`` attribute hops.
        self.player.player.player.gymenv.seed(seed)

    rewards = []
    for k in range(num_episodes):
        # Restart only between episodes, never before the first one.
        if k != 0:
            self.player.restart_episode()
        score = play_one_episode(self.player, self.predfunc)
        print(env + ' TP, score: ', score)
        rewards.append(score)
    return sum(rewards) / float(len(rewards))