Exemples Python de computeValue (lp.computeValue)

Exemple #1

0

Afficher le fichier

Fichier : greedyConstructionAgents.py Projet : shunzh/RLCodeBase

 def __init__(self, cmp, rewardSet, initialPhi, queryType, gamma, qi=False):
   """
   Initialise the agent through QTPAgent and select the value routine.

   cmp, rewardSet, initialPhi, queryType, gamma: forwarded unchanged to
     QTPAgent.__init__.
   qi: query iteration flag, kept on the instance as self.qi.
   """
   QTPAgent.__init__(self, cmp, rewardSet, initialPhi, queryType, gamma)

   # remember whether query iteration was requested
   self.qi = qi
   self.m = 1

   # self.computeV always accepts (pi, S, A, r, horizon); each backend only
   # uses the arguments it needs, so callers do not have to know which one
   # is installed.
   if not hasattr(self, 'computePiValue'):
     self.computeV = lambda pi, S, A, r, horizon: lp.computeValue(pi, r, S, A)
   else:
     # policy gradient agents bring their own way of computing values
     self.computeV = lambda pi, S, A, r, horizon: self.computePiValue(pi, r, horizon)

Exemple #2

0

Afficher le fichier

    def __init__(self, mdp, k):
        """
        Store the MDP and k, then select the value routine.

        mdp: kept on the instance as self.mdp.
        k: kept on the instance as self.k.
        """
        self.mdp, self.k = mdp, k

        # self.computeV always accepts (pi, S, A, r, horizon); policy gradient
        # agents (those defining computePiValue) have their own way to compute
        # values, everything else goes through lp.computeValue.
        self.computeV = (
            (lambda pi, S, A, r, horizon: self.computePiValue(pi, r, horizon))
            if hasattr(self, 'computePiValue')
            else (lambda pi, S, A, r, horizon: lp.computeValue(pi, r, S, A))
        )

Exemple #3

0

Afficher le fichier

    def __init__(self, cmp, rewardSet, initialPhi, queryType, gamma, qi=False):
        """
        Initialise the agent through QTPAgent and select the value routine.

        cmp, rewardSet, initialPhi, queryType, gamma: forwarded unchanged to
            QTPAgent.__init__.
        qi: query iteration flag, kept on the instance as self.qi.
        """
        QTPAgent.__init__(self, cmp, rewardSet, initialPhi, queryType, gamma)

        # remember whether query iteration was requested
        self.qi = qi
        self.m = 1

        # Uniform (pi, S, A, r, horizon) signature for both backends: policy
        # gradient agents (those defining computePiValue) compute values their
        # own way, all others use lp.computeValue.
        self.computeV = (
            (lambda pi, S, A, r, horizon: self.computePiValue(pi, r, horizon))
            if hasattr(self, 'computePiValue')
            else (lambda pi, S, A, r, horizon: lp.computeValue(pi, r, S, A))
        )

Exemple #4

0

Afficher le fichier

Fichier : consQueryAgents.py Projet : shunzh/RLCodeBase

 def computeValue(self, x):
   """
   Return the result of the module-level computeValue for x, called with
   this agent's self.mdp.r, self.mdp.S and self.mdp.A.
   """
   mdp = self.mdp
   return computeValue(x, mdp.r, mdp.S, mdp.A)

Exemple #5

0

Afficher le fichier

Fichier : consQueryAgents.py Projet : ashdtu/constrained-MDP

 def computeValue(self, x):
     """
     Compute the value of policy x, i.e. the dot product between x and r.

     Delegates to the module-level computeValue with this agent's
     self.mdp.r, self.mdp.S and self.mdp.A.
     """
     mdp = self.mdp
     return computeValue(x, mdp.r, mdp.S, mdp.A)

Exemple #6

0

Afficher le fichier

 def computeValue(self, x):
     """
     Return the result of the module-level computeValue for x, called with
     this agent's self.mdp.r, self.mdp.S and self.mdp.A.
     """
     mdp = self.mdp
     return computeValue(x, mdp.r, mdp.S, mdp.A)