Esempio n. 1
0
 def greedy(self, state):
     """Return the playable column whose successor has the highest lookup value.

     Columns 0-6 are tried in order. Each column accepted by
     ``c4.isValidMove`` is played for ``self.player`` with ``c4.makeMove``
     and the resulting state is scored with ``self.lookup``. The best score
     found is passed to ``self.backup`` before returning.

     Returns the chosen column index, or ``None`` if no score exceeded the
     initial ``-inf``.
     """
     best_value, best_column = float('-inf'), None
     for column in range(7):
         if not c4.isValidMove(state, column):
             continue
         successor = c4.makeMove(state, self.player, column)
         candidate = self.lookup(successor)
         # Strict comparison: on ties the lowest-numbered column wins.
         if candidate > best_value:
             best_value, best_column = candidate, column
     # NOTE(review): when no column is playable this passes -inf to backup
     # and returns None -- confirm callers never reach that case.
     self.backup(best_value)
     return best_column
 def greedy(self, state):
     """Greedily select a move by one-step lookahead over the seven columns.

     For every column that ``c4.isValidMove`` accepts, the move is applied
     for ``self.player`` via ``c4.makeMove`` and the new state is valued
     with ``self.lookup``. The highest value seen is forwarded to
     ``self.backup``.

     Returns the index of the highest-valued column (first one on ties), or
     ``None`` when nothing scored above ``-inf``.
     """
     top_score = float('-inf')
     chosen = None
     for col in range(7):
         if c4.isValidMove(state, col):
             score = self.lookup(c4.makeMove(state, self.player, col))
             if not score > top_score:
                 continue
             top_score = score
             chosen = col
     # NOTE(review): backup is called unconditionally, so it receives -inf
     # if no column was valid -- verify that is intended.
     self.backup(top_score)
     return chosen
Esempio n. 3
0
 def greedy(self, state, player=1):
     """Return the playable column whose successor the network rates highest.

     Columns 0-6 are tried in order. Each column accepted by
     ``c4.isValidMove`` is played for ``player`` with ``c4.makeMove``; the
     result is encoded by ``c4.getNeuralInput``, reshaped to ``(1, 126)``
     and scored with ``self.net.predict`` (``batch_size=1``). The best
     prediction is passed to ``self.backup`` before returning.

     Returns the chosen column index, or ``None`` if no prediction exceeded
     the initial ``-inf``.
     """
     best_value, best_move = float("-inf"), None
     # TODO: implement get_possible_moves in c4
     for column in range(7):
         if not c4.isValidMove(state, column):
             continue
         successor = c4.makeMove(state, player, column)
         net_input = c4.getNeuralInput(successor).reshape(1, 126)
         prediction = self.net.predict(net_input, batch_size=1)
         # Strict comparison: on ties the lowest-numbered column wins.
         if prediction > best_value:
             best_value, best_move = prediction, column
     # NOTE(review): with no playable column, backup receives -inf and the
     # method returns None -- confirm callers never reach that case.
     self.backup(best_value)
     return best_move
Esempio n. 4
0
 def greedy(self, state, player=1):
     """Greedily pick a move using the network's one-step-ahead prediction.

     For every column that ``c4.isValidMove`` accepts, the move is applied
     for ``player`` via ``c4.makeMove``, the new state is converted with
     ``c4.getNeuralInput`` and reshaped to ``(1, 126)``, and
     ``self.net.predict`` is called on it with ``batch_size=1``. The highest
     prediction seen is forwarded to ``self.backup``.

     Returns the index of the highest-rated column (first one on ties), or
     ``None`` when nothing scored above ``-inf``.
     """
     top_score = float("-inf")
     chosen = None
     # TODO: implement get_possible_moves in c4
     for col in range(7):
         if c4.isValidMove(state, col):
             after_move = c4.makeMove(state, player, col)
             features = c4.getNeuralInput(after_move).reshape(1, 126)
             score = self.net.predict(features, batch_size=1)
             if not score > top_score:
                 continue
             top_score = score
             chosen = col
     # NOTE(review): backup is called unconditionally, so it receives -inf
     # if no column was valid -- verify that is intended.
     self.backup(top_score)
     return chosen