def main():
    """Train a Q-table on a fresh GridWorld, evaluate it, and report the result.

    Creates a ``GridWorld``, allocates a zero-initialised Q-table, passes both
    to ``train``, then passes the world and the table returned by ``train`` to
    ``evaluate``. The value returned by ``evaluate`` is printed, followed by
    its length.
    """
    world = GridWorld()

    # First axis has one entry per action reported by the world.
    # NOTE(review): the trailing 7 and 10 are presumably the grid's
    # dimensions -- confirm against GridWorld before changing either.
    action_count = len(world.available_actions())
    q_table = np.zeros([action_count, 7, 10])

    q_table = train(world, q_table)
    moves = evaluate(world, q_table)

    # Single-argument parenthesised print emits the same text under both
    # Python 2 (print statement) and Python 3 (print function).
    print('Moves: ' + str(moves))
    print('Steps: ' + str(len(moves)))