def greedy(self, state):
    """Return the valid move whose successor state has the highest value.

    Move indices 0-6 are tried in ascending order (presumably the seven
    Connect Four columns -- confirm against ``c4``). Each valid move is
    applied for ``self.player`` via ``c4.makeMove`` and the resulting
    state is scored with ``self.lookup``. Ties keep the lowest index
    because only a strictly greater value replaces the current best.

    The best value found is passed to ``self.backup`` before returning.
    If no index is valid, ``self.backup`` receives negative infinity and
    ``None`` is returned.
    """
    best_value = float('-inf')
    best_move = None
    for candidate in range(7):
        # Skip moves the board does not currently allow.
        if not c4.isValidMove(state, candidate):
            continue
        successor = c4.makeMove(state, self.player, candidate)
        score = self.lookup(successor)
        if score > best_value:
            best_value, best_move = score, candidate
    self.backup(best_value)
    return best_move
def greedy(self, state, player=1):
    """Return the valid move whose successor state the network rates highest.

    Move indices 0-6 are tried in ascending order. Each valid move is
    applied for ``player`` via ``c4.makeMove``; the successor is encoded
    with ``c4.getNeuralInput``, reshaped to ``(1, 126)`` and scored by
    ``self.net.predict`` with ``batch_size=1``. Only a strictly greater
    score replaces the current best, so ties keep the lowest index.

    The best score is handed to ``self.backup`` before returning. When no
    move is valid, ``self.backup`` receives negative infinity and ``None``
    is returned.
    """
    best_score = float("-inf")
    chosen = None
    # TODO: implement get_possible_moves in c4
    # Lazy generator: validity is checked just before each move is scored,
    # in the same order as a plain loop with an inner ``if``.
    playable = (m for m in range(7) if c4.isValidMove(state, m))
    for m in playable:
        successor = c4.makeMove(state, player, m)
        features = c4.getNeuralInput(successor).reshape(1, 126)
        score = self.net.predict(features, batch_size=1)
        if score > best_score:
            best_score = score
            chosen = m
    self.backup(best_score)
    return chosen
def greedy(self, state, player=1):
    """Choose the move with the highest network-predicted successor value.

    For every move index in ``range(7)`` accepted by ``c4.isValidMove``,
    the move is played for ``player`` with ``c4.makeMove`` and the new
    state is evaluated by ``self.net.predict`` on the
    ``c4.getNeuralInput`` encoding reshaped to ``(1, 126)``. The first
    move reaching the maximum wins, since the comparison is strict.

    ``self.backup`` is called once with the best prediction found (or
    negative infinity if nothing was valid), and the selected move index,
    or ``None``, is returned.
    """
    top_value = float("-inf")
    top_move = None
    # TODO: implement get_possible_moves in c4
    for column in range(7):
        if not c4.isValidMove(state, column):
            continue
        after_move = c4.makeMove(state, player, column)
        net_input = c4.getNeuralInput(after_move).reshape(1, 126)
        prediction = self.net.predict(net_input, batch_size=1)
        if prediction > top_value:
            top_value, top_move = prediction, column
    self.backup(top_value)
    return top_move