Ejemplo n.º 1
0
            agent.episode()
            if agent.episodes > 1 and not agent.episodes % interval:
                winrate = sum(agent.goal) / len(agent.goal)
                avgsteps = sum(agent.last100) / len(agent.last100)
                wstr += ',{}'.format(winrate)
                astr += ',{}'.format(avgsteps)
                print('Episode {}...'.format(agent.episodes))
        w.write(wstr + '\n')
        a.write(astr + '\n')
        agent.reset()
    # Alpha sweep: open a new section in both outputs with an 'Alpha' title
    # line followed by top_label (defined outside this excerpt; presumably the
    # column-header row -- TODO confirm).
    w.write('Alpha\n')
    a.write('Alpha\n')
    w.write(top_label)
    a.write(top_label)
    print('Testing Alphas...')
    for alpha in tenths:
        agent.alpha = alpha
        # Both rows start out identical: the alpha value, then a literal 0.
        wstr = astr = '{},0'.format(alpha)
        for i in range(episodes):
            agent.episode()
            # Take a sample only when the agent's episode counter is above 1
            # and an exact multiple of interval.
            # NOTE(review): assumes agent.episode() advances agent.episodes --
            # confirm against the agent class.
            if agent.episodes > 1 and not agent.episodes % interval:
                # Arithmetic means of whatever agent.goal and agent.last100
                # currently hold (their contents are not visible here).
                winrate = sum(agent.goal) / len(agent.goal)
                avgsteps = sum(agent.last100) / len(agent.last100)
                # Append each sample as one more comma-separated field.
                wstr += ',{}'.format(winrate)
                astr += ',{}'.format(avgsteps)
                print('Episode {}...'.format(agent.episodes))
        # One finished row per alpha value: win rates go to w, average steps
        # go to a.
        w.write(wstr + '\n')
        a.write(astr + '\n')
        # NOTE(review): presumably restores the agent to a fresh state before
        # the next alpha is tried -- verify what reset() actually clears.
        agent.reset()