class ApproximateQLearningAgent:
    """Epsilon-greedy Q-learning agent whose Q-values are estimated by a
    linear function approximator (``LinearApproximator``, defined elsewhere
    in this project).

    Parameters
    ----------
    eps : float
        Exploration probability for epsilon-greedy action selection.
    alpha : float
        Learning rate forwarded to the approximator's weight update.
    discount : float
        Discount factor (gamma) for future rewards.
    targetPos :
        Target position forwarded to ``LinearApproximator`` — presumably
        used by its feature extraction; confirm against that class.
    actionStrategy : str
        ``"Absolute"`` or ``"Differential"``; selects the discrete action set.

    Raises
    ------
    ValueError
        If ``actionStrategy`` is not one of the supported names.
    """

    # (x, y) action tuples.  NOTE(review): "Absolute" omits the (0, *)
    # column, while "Differential" is the full 3x3 grid including the
    # no-op (0, 0); the asymmetry looks intentional but is worth confirming.
    _ACTION_SETS = {
        "Absolute": ((-1, -1), (-1, 0), (-1, 1),
                     (1, -1), (1, 0), (1, 1)),
        "Differential": ((-1, -1), (-1, 0), (-1, 1),
                         (0, -1), (0, 0), (0, 1),
                         (1, -1), (1, 0), (1, 1)),
    }

    def __init__(self, eps, alpha, discount, targetPos, actionStrategy="Absolute"):
        if actionStrategy not in self._ACTION_SETS:
            # BUG FIX: the original printed a message and returned, leaving
            # the agent half-initialized (no actions/QValues/eps/... set),
            # which surfaced later as a confusing AttributeError.  Fail fast.
            raise ValueError("Not valid action strategy: %r" % (actionStrategy,))
        self.actions = self._ACTION_SETS[actionStrategy]
        self.QValues = LinearApproximator(self.actions, targetPos)
        self.eps = eps
        self.alpha = alpha
        self.discount = discount

    def getBestActionMaxQValue(self, state):
        """Return ``(bestAction, maxQValue)`` for *state* per the approximator."""
        bestAction, maxQValue = self.QValues.getBestActionMaxQValue(state)
        return (bestAction, maxQValue)

    def selectAction(self, state):
        """Epsilon-greedy selection: with probability ``eps`` return a uniform
        random action, otherwise the greedy (max-Q) action for *state*."""
        if random.uniform(0, 1) < self.eps:
            # Explore: idiomatic random.choice replaces the original
            # randint-based indexing (same uniform distribution).
            return random.choice(self.actions)
        # Exploit: greedy action under the current approximation.
        return self.getBestActionMaxQValue(state)[0]

    def update(self, state, action, newState, reward):
        """Perform one TD update of the approximator's weights."""
        self.QValues.updateWeights(state, action, newState, reward,
                                   self.discount, self.alpha)
def __init__(self, eps, alpha, discount, targetPos, actionStrategy="Absolute"):
    """Initialize the agent: pick the discrete action set for
    *actionStrategy* ("Absolute" or "Differential"), build the
    ``LinearApproximator`` over it, and store the learning
    hyper-parameters (eps, alpha, discount).

    Raises ``ValueError`` for an unknown *actionStrategy*.  (BUG FIX:
    the original printed a message and returned, leaving the instance
    half-initialized and failing later with an AttributeError.)
    """
    if actionStrategy == "Absolute":
        # 3x3 step neighbourhood minus the zero-x column.
        self.actions = ((-1, -1), (-1, 0), (-1, 1),
                        (1, -1), (1, 0), (1, 1))
    elif actionStrategy == "Differential":
        # Full 3x3 neighbourhood including the no-op (0, 0).
        self.actions = ((-1, -1), (-1, 0), (-1, 1),
                        (0, -1), (0, 0), (0, 1),
                        (1, -1), (1, 0), (1, 1))
    else:
        raise ValueError("Not valid action strategy: %r" % (actionStrategy,))
    self.QValues = LinearApproximator(self.actions, targetPos)
    self.eps = eps
    self.alpha = alpha
    self.discount = discount