Ejemplo n.º 1
0
    # Values returned by run_episode() for each agent, in episode order.
    # They are printed below as "Reward" (presumably the per-episode reward
    # total -- confirm against the simulator's run_episode()).
    sarsa_vals, random_vals = [], []

    # Header banner.
    banner_rule = "===================================="
    for banner_line in (banner_rule,
                        "          AGENT COMPARISON          ",
                        banner_rule):
        print(banner_line)

    print()
    print("SARSA agent with Fourier series vs Random Action agent")
    print()
    print("Simulating...")

    # Each episode runs the SARSA simulator first, then the random one.
    # Table rows: (progress prompt, simulator, list receiving its result).
    agent_table = (
        ("\tSARSA episode...", sarsa_sim, sarsa_vals),
        ("\tRandom episode...", random_sim, random_vals),
    )
    for i in range(1, ep_count+1):
        print("Episode %d" % i)
        for agent_prompt, agent_sim, agent_rewards in agent_table:
            # The prompt has no trailing newline, so flush explicitly to make
            # it visible while the episode is still running.
            print(agent_prompt, end="")
            sys.stdout.flush()
            agent_rewards.append(agent_sim.run_episode())
            print(" Done. Reward: %d" % agent_rewards[-1])
        print()

    # Summary: mean and sample standard deviation (ddof=1) per agent.
    summary_table = (
        ("Average SARSA reward: %.5f +- %.2f", sarsa_vals),
        ("Average Random reward: %.5f +- %.2f", random_vals),
    )
    for summary_fmt, agent_rewards in summary_table:
        print(summary_fmt % (np.mean(agent_rewards),
                             np.std(agent_rewards, ddof=1)))
    print()

    # Raw per-episode values for both agents.
    print("SARSA points: %s" % str(sarsa_vals))
    print("Random points: %s" % str(random_vals))
    print()
    #print()
    #print("Plots:")