# Train the learner over a fixed number of games ("epochs"), recording the
# score of each game, then plot the scores against the epoch number.
iters = 150
learner = Learner()
scores = []

# `range` is used instead of `xrange` so the script runs on both Python 2
# and Python 3 (`xrange` does not exist in Python 3).
for ii in range(iters):

    # Make a new monkey object.
    swing = SwingyMonkey(
        sound=False,               # Don't play sounds.
        text="Epoch %d" % (ii),    # Display the epoch on screen.
        tick_length=1,             # Make game ticks super fast.
        action_callback=learner.action_callback,
        reward_callback=learner.reward_callback,
    )

    # Loop until you hit something.
    while swing.game_loop():
        pass

    # Record the score reached in this game.
    scores.append(swing.get_score())

    # Reset the state of the learner before the next game.
    learner.reset()

# Epochs are numbered 1..iters on the x-axis (the on-screen label above is
# 0-based because it uses the raw loop index).
domain = np.arange(1, iters + 1, 1)

plt.plot(domain, scores)
plt.title("Scores over each Epoch (discount = " + str(learner.discount) + ")")
plt.xlabel("Epoch")
plt.ylabel("Score")

# Write the figure to disk first, then open the interactive window.
plt.savefig("scores.png")
plt.show()