def __init__(self, **args):
    """Set up the Q-learner's tables; actual learning happens later."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # Q-values live in a Counter keyed by (state, action): unseen pairs
    # read as 0.0 automatically. A second Counter holds state values.
    # (The batch value-iteration pseudo code that used to live here was
    # only a planning sketch -- nothing more is needed in init.)
    self.qvalues = util.Counter()
    self.values = util.Counter()
def __init__(self, **args):
    """Initialize Q-value and visit-count storage."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # Plain dicts: Qvalues maps (state, action) pairs to learned values,
    # visit tracks how often each pair has been seen.
    self.Qvalues = {}
    self.visit = {}
def __init__(self, **args):
    """Create the agent and its (state, action) -> Q-value table."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # util.Counter defaults every unseen key to 0.0.
    self.qvalues = util.Counter()
def __init__(self, **args):
    """Build the Q-value map used by the learner."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # The Counter behaves like a dict indexed by (state, action) tuples
    # and hands back 0 for anything not yet learned.
    self.qValueMap = util.Counter()
def __init__(self, **args):
    """Initialize the Q table."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # Counter (a map) keyed by state + action; value is the Q estimate.
    self.Q = util.Counter()
def __init__(self, numOfTurn, numofgauss, var, lamda, gaussDim, **args):
    "You can initialize Q-values here..."
    ReinforcementAgent.__init__(self, **args)
    self.qVal = util.Counter()
    # Hyper-parameters of the Gaussian radial-basis-function model.
    self.numofgauss = numofgauss   # number of Gaussian basis functions
    self.var = var                 # shared per-dimension variance of each basis
    self.lamda = lamda             # regularization weight (presumably ridge -- TODO confirm where used)
    self.numOfTurn = numOfTurn     # number of turn indices to prepare parameters for
    self.gaussDim = gaussDim       # dimensionality of each Gaussian's mean
    # init basis: basis i has every coordinate of its mean equal to
    # i / numofgauss, and an isotropic diagonal covariance var * I.
    self.basis = []
    for i in range(self.numofgauss):
        base = {}
        base['mean'] = np.matrix( [ float(i)/float(self.numofgauss) for j in range(0,self.gaussDim)] )
        base['var'] = np.matrix( np.diag([self.var for j in range(0,self.gaussDim)]) )
        base['detOfVar'] = np.linalg.det(base['var']) # pre-calculate deteminant of covariance
        base['invOfVar'] = np.linalg.inv(base['var']) # pre-calculate inverse of covariance
        self.basis.append(base)
    # init parameters: per (turn, action) pair keep a weight column vector
    # (theta), one feature list per basis (phi), and a label list.
    self.thetas = {}
    self.phis = {}
    self.labels = {}
    self.state_action_num = 0
    for t in range(0,self.numOfTurn):
        for a in util.turnIndex2action('b','cycle_tree',t):
            self.thetas[(t,a)] = np.matrix([[0.0] \
                for i in range(self.numofgauss)])
            self.phis[(t,a)] = [[] for i in range(self.numofgauss)]
            self.labels[(t,a)] = []
            self.state_action_num += 1 # count self.state_action_num
def __init__(self, **args):
    """Set up an empty table of Q estimates."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # Entries look like ((state, action), Q(s, a)); missing keys read as 0.
    self.qValues = util.Counter()
def __init__(self, **args):
    """Initialize the learner's Q-value store."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # Maps (state, action) pairs to Q values; default is 0.
    self.qvalues = Counter()
def __init__(self, **args):
    """Construct the agent; learned values start out empty."""
    ReinforcementAgent.__init__(self, **args)
    # Everything the agent has learnt so far about the board lives in
    # this Counter, with a default of 0 for unseen keys.
    self.qlearntVals = util.Counter()
def __init__(self, **args):
    """Prepare the nested Q-value dictionary."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # Layout: outer key is the state, inner mapping is action -> value.
    self.qValues = {}
def __init__(self, **args):
    """Create Q-value and state-usage counters."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # qValues: (state, action) -> estimate; state_uses: usage bookkeeping.
    self.qValues = util.Counter()
    self.state_uses = util.Counter()
def __init__(self, **args):
    """Build the per-state Q-value store."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # Each state lazily gets its own util.Counter of action values.
    self.q_values = defaultdict(util.Counter)
def __init__(self, **args):
    """Initialize the agent's value table."""
    ReinforcementAgent.__init__(self, **args)
    # util.Counter (from util.py) defaults missing keys to 0.
    self.states = util.Counter()
    "*** YOUR CODE HERE ***"
def __init__(self, **args):
    """Record all Q-values in one Counter-backed dictionary."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    ## Single Counter holding every Q estimate; absent keys act as zero.
    self.Q_Values = util.Counter()
def __init__(self, numOfTurn, numofgauss=5, var=0.25, lamda=0, **args):
    "You can initialize Q-values here..."
    ReinforcementAgent.__init__(self, **args)
    self.qVal = util.Counter()
    # Radial-basis-function hyper-parameters.
    self.numofgauss = numofgauss   # number of Gaussian bases
    self.var = var                 # shared variance on each of the 82 dims
    self.lamda = lamda             # regularization weight (TODO confirm where used)
    self.numOfTurn = numOfTurn
    # Minimum sample count threshold -- larger basis sets require more data.
    if self.numofgauss<=5:
        self.minimumNum = 10
    else:
        self.minimumNum = 20
    # init basis: basis i has every coordinate of its mean at i/numofgauss;
    # the feature dimension is hard-coded to 82 here.
    self.basis = []
    for i in range(self.numofgauss):
        base = {}
        base['mean'] = [ float(i)/float(self.numofgauss) for j in range(0,82)]
        base['var'] = np.diag([var for j in range(0,82)])
        self.basis.append(base)
    # init parameters: per (turn, action) pair keep a weight column vector
    # (theta), one feature list per basis (phi), and a label list.
    self.thetas = {}
    self.phis = {}
    self.labels = {}
    self.state_action_num = 0
    for t in range(0,self.numOfTurn):
        for a in util.turnIndex2action('b','cycle_tree',t):
            self.thetas[(t,a)] = np.matrix([[0.0] \
                for i in range(self.numofgauss)])
            self.phis[(t,a)] = [[] for i in range(self.numofgauss)]
            self.labels[(t,a)] = []
            self.state_action_num += 1 # count self.state_action_num
def __init__(self, **args):
    """Start the learner with an all-zero Q table."""
    ReinforcementAgent.__init__(self, **args)
    # Counter returns 0 for every (state, action) not yet updated.
    self.qVals = util.Counter()
    "*** YOUR CODE HERE ***"
def __init__(self, **args):
    """Construct the agent; alpha/discount/epsilon arrive via **args."""
    ReinforcementAgent.__init__(self, **args)
    # Q estimates keyed by (state, action), zero until learned.
    self.qValues = util.Counter()
def __init__(self, **args):
    """Initialize storage for learned Q-values."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # Keeps track of the q values; unseen keys default to 0.
    self.values = util.Counter()
def __init__(self, **args):
    """Create the (initially empty) Q table."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # Plain dictionary; callers are expected to handle missing keys.
    self.qTable = dict()
def __init__(self, **args):
    "You can initialize Q-values here..."
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # State values (default 0) plus the relational machinery: a predicate
    # set over the blocksworld and a Q-tree used for value estimates.
    # NOTE(review): assumes self.mdp was set before this runs (presumably
    # by the parent __init__) -- confirm against ReinforcementAgent.
    self.values = util.Counter()
    self.predicate = BlocksworldPred(self.mdp.count, self.mdp.stackNum)
    self.root = QTreeNode(.01, self.mdp.count) # FIXME epsilon should passed via command line
def __init__(self, **args):
    """Set up the agent's value store."""
    ReinforcementAgent.__init__(self, **args)
    # util.Counter is an extension of dict that keeps track of counts
    # for a set of keys, yielding 0 for any key never written.
    self.values = util.Counter()
def __init__(self, **args):
    """Initialize values, mirroring valueIterationAgents.py."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # A Counter is just a dict whose missing entries read as 0.
    self.values = util.Counter()
def __init__(self, **args):
    """Create the (state, action) Q-value Counter."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # Q-values are organised as one util.Counter of (state, action) pairs.
    self.qvalues = util.Counter()
def __init__(self, **args):
    """Initialize the learner with an empty Q table.

    Fix: the original created a local ``states = []`` list that was never
    read or stored anywhere; the dead variable has been removed.
    """
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # keep a Counter/Dictionary of Q-values; unseen keys default to 0
    self.qvalues = util.Counter()
def __init__(self, **args):
    """Set up Q-value storage and an (unset) environment handle."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # QValues: (state, action) -> estimate, defaulting to 0.
    self.QValues = util.Counter()
    # The environment is attached later by whoever drives the agent.
    self.environment = None
def __init__(self, **args):
    """Prepare per-state Q-value and visit-count dictionaries."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # Both maps are filled lazily; qValues is a dict of util.Counter().
    self.qValues = {}
    self.visitCount = {}
def __init__(self, **args):
    """Create the agent and an empty map for per-state information."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # In init we only create an empty dictionary in which to store
    # the information about the states.
    self.qValues = util.Counter()
def __init__(self, **args):
    """Initialize the Q table and the random-exploration schedule."""
    ReinforcementAgent.__init__(self, **args)
    self.Q = util.Counter()
    # Modify greedy_constraint to set how many actions are chosen
    # randomly before the agent starts selecting greedily; to_greedy
    # is the running count toward that threshold.
    self.greedy_constraint = 100
    self.to_greedy = 0
def __init__(self, **args):
    """Build the Counter that backs all Q estimates."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # A Counter is the natural home for Q values: every entry starts
    # at 0 without any explicit per-key setup.
    self.qvalues = util.Counter()
def __init__(self, **args):
    """Initialize Q-values plus transition/reward bookkeeping."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # qValues/rewards default to 0 via Counter; stateProbs is a plain
    # dict filled in as transitions are observed.
    self.qValues = util.Counter()
    self.stateProbs = {}
    self.rewards = util.Counter()
def __init__(self, **args):
    """Create the Q-value Counter."""
    ReinforcementAgent.__init__(self, **args)
    # Plays the same role `values` does in valueIterationAgents.py.
    self.qValues = util.Counter()
def __init__(self, **args):
    """Set up a two-level Q-value map: state -> action -> float."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # Nested defaultdicts: both levels materialize on first access and
    # unknown (state, action) pairs read as 0.0.
    self.Qvalues = defaultdict(lambda: defaultdict(float))
def __init__(self, **args):
    """Construct the agent with an empty Q table."""
    ReinforcementAgent.__init__(self, **args)
    # QVals holds the (state, action) estimates, zero by default.
    self.QVals = util.Counter()
def startEpisode(self):
    # Delegate the standard per-episode bookkeeping to the parent, then
    # reset the working epsilon to its configured starting value
    # (presumably it is decayed during the episode elsewhere -- confirm).
    ReinforcementAgent.startEpisode(self)
    self.episode_epsilon = self.episode_init_epsilon
def __init__(self, **args):
    """Initialize the Q-value table."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # One Counter keyed by (state, action); zero until learned.
    self.qValues = util.Counter()
def __init__(self, **args):
    """Create the state/action bookkeeping dictionary."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # Filled in lazily as state/action pairs are encountered.
    self.statesActions = dict()
def __init__(self, **args):
    """Set up the hash (dict) of Q-values."""
    ReinforcementAgent.__init__(self, **args)
    "*** YOUR CODE HERE ***"
    # Plain dict; callers manage defaults for unseen keys.
    self.qValueHash = {}