Python Othello.OthelloEnv示例

编程语言: Python

类/类型: Othello

方法/功能: OthelloEnv

hotexamples.com的示例: 4

Python Othello.OthelloEnv - 已找到4个示例。这些是从开源项目中提取的最受好评的Othello.OthelloEnv现实Python示例。您可以评价示例，以帮助我们提高示例质量。

常用方法

显示隐藏

Othello(11)

OthelloEnv(4)

Game(2)

black_score(2)

current_player(2)

columns(2)

cell(2)

_turn(1)

_opposite_turn(1)

checkValidAndMove(1)

UCT(1)

countPieces(1)

Othello_game_state(1)

determineWinner(1)

determineWinnerLeast(1)

displayBoard(1)

place_piece(1)

示例#1

显示文件

 def __init__(self):
     """Initialise the instance: create the Othello environment, build the UI, set initial state."""
     super().__init__()
     # Environment instance used by this object; created before initUI() runs.
     self.env = Env.OthelloEnv()
     self.initUI()
     # NOTE(review): the meaning of `i` is not visible in this snippet; it starts at 0.
     self.i = 0
     # Reuses the `Q` object exposed by the `test` module
     # (presumably a learned Q-table -- confirm against `test`).
     self.Q = test.Q

示例#2

显示文件

文件： my.py 项目： WangChen0902/Othello

def f(state, action):
    """Apply ``action`` to ``state`` in a fresh environment.

    A new ``Env.OthelloEnv`` is created, its ``state`` attribute is set to
    ``state`` and ``_step(action)`` is called once.

    Returns:
        A ``(next_state, done)`` tuple; the reward returned by ``_step`` is
        discarded.
    """
    scratch_env = Env.OthelloEnv()
    scratch_env.state = state
    next_state, _reward, done = scratch_env._step(action)
    return next_state, done

示例#3

显示文件

文件： MC.py 项目： WangChen0902/Othello

def main():
    """Estimate per-square values with Monte Carlo and benchmark a greedy policy.

    Steps:
      1. Run ``mc_prediction`` with ``random_policy`` for 10 episodes and
         collect the values for squares 0..63 into ``value_list``.
      2. Print ``value_list`` as an 8x8 grid.
      3. Play one unrecorded game followed by 1000 recorded games in which
         the side with flag ``1`` uses the greedy ``mid_policy`` and the side
         with flag ``-1`` uses ``random_policy``; print the fraction of
         recorded games whose final board sum is positive.
    """
    env = Env.OthelloEnv()
    values = mc_prediction(random_policy, env, num_episodes=10)
    # Squares 27, 28, 35 and 36 (the four centre squares of the flat 8x8
    # board) are overwritten with a fixed value of 1.
    values[27] = 1
    values[28] = 1
    values[35] = 1
    values[36] = 1
    value_list = [values[i] for i in range(64)]
    # Existing experience-based weight matrix, kept for reference:
    # value_list = [10, -9, 8, 4, 4, 8, -9, 10,
    #               -9, -9, -4, -3, -3, -4, -9, -9,
    #               8, -4, 8, 2, 2, 8, -4, 8,
    #               4, 3, 2, 1, 1, 2, 3, 4,
    #               4, 3, 2, 1, 1, 2, 3, 4,
    #               8, -4, 8, 2, 2, 8, -4, 8,
    #               -9, -9, -4, -3, -3, -4, -9, -9,
    #               10, -9, 8, 4, 4, 8, -9, 10]

    # Print the value matrix: one board row per output line, then a blank
    # line. The row-ending print() must sit outside the column loop,
    # otherwise every value ends up on its own line.
    for row in range(8):
        for col in range(8):
            print(value_list[8 * row + col], end=' ')
        print()
    print()

    # Play games.
    def mid_policy(state, flag):
        """Return ``[flag, move]`` for the legal move with the highest value.

        Returns ``[0, 0]`` when ``judge`` reports no legal move for ``flag``.
        """
        legal_moves = judge(state, flag)
        if len(legal_moves) == 0:
            return [0, 0]
        # Score every candidate by the value of the square it targets, not
        # by its position inside ``legal_moves``. Ties resolve to the first
        # candidate, as with ``list.index(max(...))``.
        # assumes judge() returns flat board indices 0..63 -- TODO confirm
        best_move = max(legal_moves, key=lambda pos: value_list[pos])
        return [flag, best_move]

    def play_game(env):
        """Play one game on ``env``; return 1 if the final board sum is > 0, else 0."""
        state = env._reset()
        flag = 1
        action = mid_policy(state, flag)
        done = False
        while not done:
            state, _reward, done = env._step(action)
            # Alternate sides: flag 1 plays greedily, flag -1 plays randomly.
            flag = -flag
            if flag == 1:
                action = mid_policy(state, flag)
            else:
                action = random_policy(state, flag)
        total = sum(state[k] for k in range(64))
        return 1 if total > 0 else 0

    env = Env.OthelloEnv()
    # One game is played and its result discarded before the counted run.
    play_game(env)
    num_games = 1000
    wins = sum(play_game(env) for _ in range(num_games))
    print(wins / num_games)

示例#4

显示文件

文件： my.py 项目： WangChen0902/Othello

import sys
import random

from collections import defaultdict
import Othello as Env
from Othello import judge


def random_policy(state, flag):
    """Pick a uniformly random move from those ``judge`` returns for ``flag``.

    Returns:
        ``[flag, move]`` for the chosen move, or ``[0, 0]`` when ``judge``
        returns an empty collection.
    """
    candidates = judge(state, flag)
    count = len(candidates)
    if count == 0:
        return [0, 0]
    return [flag, candidates[random.randrange(count)]]


def f(state, action):
    """Apply ``action`` to ``state`` in a fresh environment.

    A new ``Env.OthelloEnv`` is created, its ``state`` attribute is set to
    ``state`` and ``_step(action)`` is called once.

    Returns:
        A ``(next_state, done)`` tuple; the reward returned by ``_step`` is
        discarded.
    """
    scratch_env = Env.OthelloEnv()
    scratch_env.state = state
    next_state, _reward, done = scratch_env._step(action)
    return next_state, done


# Demo executed at module import time: reset a fresh environment, take one
# random move for the side with flag 1, and print the outcome.
env = Env.OthelloEnv()
env._reset()
# f() steps a separate OthelloEnv whose `state` is set to env.state;
# `ss` is the state returned by that step and `dd` its done flag.
ss, dd = f(env.state, random_policy(env.state, 1))
print(ss)
print(dd)