def main(): if flag.MARIO_ENV: env = mario_env.make_train_0() if flag.TRAIN: new_trainer = Trainer(num_training_steps=200000, num_epoch=3, batch_size=16, learning_rate=0.0001, discount_factor=0.99, env=env, num_action=7, save_interval=100, log_interval=50, decay_rate=0.001, num_steps=16, memory_size=10000, update_target_net_interval=5) new_trainer.collect_experience_and_train() elif flag.PLAY: new_player = Player(env=env, load_path='./step5500-20191027-162213/train') new_player.play()