Exemple #1
0
def TrainNode(board, root, iterNum, cur_player, step):
    """Run ``iterNum`` search iterations from ``root``, then prune its children.

    Each iteration walks down from ``root`` while the current node reports
    itself as expanded, runs ``Rollout`` on the node where the walk stops and
    feeds the result to ``BackUp``. After all iterations the index returned
    by ``MaxUCB1(root)`` is passed to ``DeleteChildren``.

    Args:
        board: Not used in this function.
        root: Node the search starts from.
        iterNum: Number of search iterations to run.
        cur_player: Player forwarded to ``Rollout`` and ``BackUp``.
        step: Forwarded unchanged to ``DeleteChildren``.

    Returns:
        None.
    """
    for _ in range(iterNum):
        # Visit count of the tree root, sampled once per iteration.
        total_visits = root.N
        cursor = root

        # Descend while the node is already expanded (i.e. not a leaf).
        while cursor.isExpand() == True:
            if not cursor.children:
                # Expanded but childless: generate the moves of the other
                # player; stop descending if there are still none.
                next_player = -cursor.player
                cursor = game.PossibleMove(cursor.Board, cursor, next_player)
                if not cursor.children:
                    break
                continue

            # Score every child with UCB1 and step into the best one.
            CalculateUCB1(cursor, total_visits)
            best_child = MaxUCB1(cursor)
            cursor = cursor.children[best_child]

        # Roll out from the selected node, then update that node and all of
        # its ancestors with the result.
        outcome = Rollout(cursor, cur_player, cursor.Board)
        BackUp(cursor, outcome, cur_player)

    # Once the search is done, pick the best child of the root and delete
    # its siblings.
    # NOTE(review): CalculateUCB1 is not called on root here, so this relies
    # on whatever scores the children already hold - confirm that is intended.
    chosen = MaxUCB1(root)
    DeleteChildren(root, chosen, step)
Exemple #2
0
def BackUp(node, value, cur_player):
    """Record a rollout result on ``node`` and on every ancestor of it.

    ``node`` gets ``value`` added, is marked as expanded and has its visit
    count increased by one. If it has no children, they are generated through
    ``game.PossibleMove`` for the opposite player. Every ancestor reachable
    through ``parent`` then receives the same ``value`` and one extra visit.

    Args:
        node: Node the rollout was started from.
        value: Rollout result to add to the node and its ancestors.
        cur_player: Not used in this function.
    """
    node.addValue(value)
    node.setExpand(True)
    node.addN(1)

    # Possible optimisation point (per the original author).
    if not node.children:
        node = game.PossibleMove(node.Board, node, -node.player)

    # Propagate the value upwards for as long as a parent exists.
    ancestor = node.parent
    while ancestor:
        ancestor.addValue(value)
        ancestor.addN(1)
        ancestor = ancestor.parent
Exemple #3
0
def isTurn(node, cur_player, step):
    """Report whether the node ``step`` levels below ``node`` has any children.

    The walk always follows the first child (``children[0]``). If the node
    reached has no children yet, they are generated with ``game.PossibleMove``
    for the opposite player before the check.

    Args:
        node: Node to start walking from.
        cur_player: Not used in this function.
        step: Number of ``children[0]`` hops to take.

    Returns:
        True if the (possibly freshly expanded) node has children, else False.
    """
    cursor = node
    for _ in range(step):
        cursor = cursor.children[0]

    if cursor.children:
        expanded = cursor
    else:
        expanded = game.PossibleMove(cursor.Board, cursor, -cursor.player)

    return True if expanded.children else False
Exemple #4
0
def Rollout(node, cur_player, board):
    """Play random moves from ``node`` until the game ends, then score it.

    Starting with a deep copy of ``board`` and the opponent of ``cur_player``
    to move, a random child is chosen repeatedly until ``game.isTerminal``
    no longer returns False, or until a second "no move available" situation
    is met.

    Args:
        node: Node the playout starts from.
        cur_player: Player whose opponent moves first in the playout.
        board: Board to start from; it is deep-copied, not modified directly.

    Returns:
        Number of cells equal to 1 (black) minus number of cells equal to -1
        (white) on the 8x8 final board. Per the original author only black
        needs rollouts, so only black's value is returned.
    """
    sim_board = copy.deepcopy(board)
    sim_player = -cur_player
    moves = []
    # One forced pass is tolerated; this is never reset, so the second pass
    # anywhere in the playout ends it.
    # NOTE(review): confirm a non-consecutive second pass should stop the game.
    passes_left = 1

    while game.isTerminal(sim_board, sim_player) == False:
        # NOTE(review): from the second iteration on, ``moves`` is the same
        # list object as the previously visited node's ``children``, so this
        # call empties that node's children in place. The original comment
        # says rollout children are not kept in the real tree - confirm that
        # this aliasing is the intended mechanism.
        moves.clear()

        # Possible optimisation point (per the original author).
        if not node.children:
            node = game.PossibleMove(sim_board, node, sim_player)
        moves = node.children

        if not moves:
            # Nowhere to play: hand the turn to the other player.
            sim_player = -sim_player
            if passes_left == 1:
                passes_left -= 1
            elif passes_left == 0:
                break
            continue

        # Pick one of the available moves at random, adopt its board and
        # switch the player to move.
        picked = node.children[getRandomChild(len(moves))]
        sim_board = picked.Board
        sim_player = -picked.player
        node = picked

    # Game over: tally the disc difference on the final board.
    margin = 0
    for row in range(8):
        for col in range(8):
            cell = sim_board[row][col]
            if cell == 1:
                margin += 1
            elif cell == -1:
                margin -= 1
    return margin
Exemple #5
0
    pygame.init()
    screen = pygame.display.set_mode((canvas_w, canvas_h))
    pygame.display.set_caption("翻转棋")

    FPS = 30
    clock = pygame.time.Clock()

    # 加载背景图片
    base_folder = os.path.dirname(__file__)
    bg_img = pygame.image.load(os.path.join(base_folder,
                                            "boardBG.jpg")).convert()

    board = game.Init(ChessBoard)
    root = Chess.Node()  # root就是棋盘初始的样子,判定条件为没有parents
    root = game.PossibleMove(board, root, cur_player)
    root.Board = board

    while True:
        drawChessBoard(screen)
        pygame.display.update()
        clock.tick(FPS)
        if StartFlag == 1:
            if game.isTerminal(board, cur_player) == True:
                cur_player = 2
            if cur_player == 1:
                print("black")
                if isTurn(root, cur_player, step) == False:
                    cur_player = -1
                temp_board = copy.deepcopy(board)
                time_start = time.time()