예제 #1
0
threshold = 0.00001
# ----------------------------------------------------------------------
# Do not edit below here
# ----------------------------------------------------------------------

# Driver script: run policy iteration and plot, for every predator
# position on the board, the state value with the prey held at a fixed
# position.
# NOTE(review): `time`, `np`, `plt`, `PredatorGame` and `discount` are
# expected to be defined earlier in this script (not visible here).

start_time = time.time()

# Named once so the game, the value lookup and the plot cannot drift apart.
preyPosition = (5, 5)
# Presumably the board dimensions (third PredatorGame argument) -- confirm.
boardSize = (11, 11)

g = PredatorGame((0, 0), preyPosition, boardSize)
print("\n----------------\nExample: Policy Iteration\n----------------")

# `c` is reported below as the iteration count; `policy` is not used here.
V, c, policy = g.policyIteration(discount, threshold)

print("Iterations: " + str(c))

# Fill the matrix directly: one cell per predator position, rounded to
# four decimals for display.
valuesMatrix = np.zeros((g.boardSize[0], g.boardSize[1]))
for row in range(boardSize[0]):
    for col in range(boardSize[1]):
        state = g.getState((row, col), preyPosition)
        valuesMatrix[row, col] = round(V[state], 4)

g.checkerboard_table(valuesMatrix, preyPosition)

# Stop the clock before showing the figure: plt.show() normally blocks
# until the window is closed, which would otherwise be counted as
# computation time.
elapsed_time = time.time() - start_time
print("Elapsed time: " + str(elapsed_time))

plt.show()
예제 #2
0
import sys
import time

import matplotlib.pyplot as plt
import numpy as np

# Extend the module search path so `predatorgame` can be imported when
# the script is run from this directory or from a sibling directory.
# `sys` must be imported for this; it was previously missing, which
# raised a NameError before anything else ran.
sys.path.append("..")
sys.path.append("./")
from predatorgame import PredatorGame

# ----------------------------------------------------------------------
# Edit parameters
# ----------------------------------------------------------------------
discount = 0.8
threshold = 0.00001
# ----------------------------------------------------------------------
# Do not edit below here
# ----------------------------------------------------------------------

# Driver script: run iterative policy evaluation and print the resulting
# value for a handful of sample states, the iteration count and the
# wall-clock time taken.

start_time = time.time()
g = PredatorGame((0, 0), (5, 5), (11, 11))

print("\n----------------\nExample: Iterative Policy Evaluation\n----------------")

# `c` is reported below as the iteration count.
V, c = g.iterativePolicyEvaluation(discount, threshold)

# Each entry is a pair of board coordinates passed to g.getState();
# presumably (predator position, prey position) -- confirm against
# PredatorGame.getState.
targets = [((0, 0), (5, 5)), ((2, 3), (5, 4)), ((2, 10), (10, 0)), ((10, 10), (0, 0))]

for ex in targets:
    print(str(ex) +  ": "  + str(V[g.getState(*ex)]))
print("Iterations: " + str(c))

elapsed_time = time.time() - start_time
print("Elapsed time: " + str(elapsed_time))