Python StateManager.init_new_game 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: state_manager

클래스/타입: StateManager

메소드/함수: init_new_game

hotexamples.com에서의 예제들: 1

Python StateManager.init_new_game - 1개의 예제를 찾았습니다. 아래는 오픈소스 프로젝트에서 추출한 Python state_manager.StateManager.init_new_game의 실제 사용 예제 가운데 가장 높은 평가를 받은 것들입니다. 예제를 평가해 주시면 예제 품질을 개선하는 데 도움이 됩니다.

자주 사용되는 메소드들

보기 숨기기

StateManager(30)

calculate_next_state(9)

is_finished(4)

add_state(3)

increment_state(3)

get_winner(3)

make_move(3)

push(2)

read(2)

is_legal(2)

load(2)

get_moves(2)

get_legal_moves(2)

get_latest_state(2)

move(2)

player1_won(2)

player2_won(2)

print_board(2)

is_game_over(2)

process_request(2)

convert_to_move(2)

close_db(2)

create_game(2)

redo(1)

setReadyVersion(1)

setVersionStateOnDisk(1)

is_optimal(1)

jsonify(1)

setSubPkgsToRemoveOnRemoval(1)

load_gpi_state(1)

lookup(1)

setRpmsToRemoveOnRemoval(1)

setPilotName(1)

receive_state(1)

setFile(1)

new_state(1)

play_game(1)

save_last_exit(1)

run_for_unittest(1)

run(1)

print_state(1)

probe(1)

set_latest(1)

removeVersion(1)

reimage(1)

start(1)

indexing_constraints(1)

is_last_exit_from_reload(1)

draw_state(1)

getActiveVersion(1)

예제 #1

파일 보기

파일: mcts.py 프로젝트: kristogj/general-purpose-mcts

class MonteCarloSearchTree:
    """
    Monte Carlo Tree Search built around a StateManager.

    The search phases (selection, expansion, simulation, backward) are exposed as separate methods so the
    caller can drive them in a loop. Node values are running averages of the simulation results, where a
    result is 1 when player 1 won and 0 otherwise; player 1 therefore maximises and any other player minimises.

    Nodes handled by this class are expected to expose the attributes ``state``, ``player``, ``parent``,
    ``children``, ``total`` (visit count) and ``value``, plus a ``get_children()`` method.
    """

    def __init__(self, game_type, game_config):
        """
        Create the state manager and start a new game on it.
        :param game_type: forwarded unchanged to StateManager
        :param game_config: forwarded unchanged to StateManager; must also contain the key "c"
        """
        self.state_manager = StateManager(game_type, game_config)
        self.root = None  # No tree until set_root is called
        self.c = game_config["c"]  # Exploration constant

        self.state_manager.init_new_game()

    def set_root(self, node):
        """
        Make the given node the root of the search tree.
        :param node: Node
        :return: None
        """
        self.root = node

    def get_augmented_value(self, node, player):
        """
        Calculation needed in order to perform the Tree Policy: the node value plus an exploration bonus.
        The bonus is added for player 1 and subtracted for every other player.
        :param node: Node - must have a parent
        :param player: int
        :return: float
        """
        # NOTE(review): node.parent.total is assumed to be at least 1 here, since the logarithm is
        # undefined for 0 - confirm callers always back-propagate through a node before selecting
        # among its children.
        c = self.c if player == 1 else -self.c
        return node.value + c * sqrt(log(node.parent.total) / (1 + node.total))

    def select(self, root):
        """
        Calculate the augmented value for each child, and select the best child for the current player.
        On ties the first child in root.children wins. Raises ValueError when root has no children.
        :param root: Node - the node whose children are ranked
        :return: Node - the chosen child
        """
        player = root.player
        # Tree Policy = Maximise for P1 and minimise for P2
        pick = max if player == 1 else min
        return pick(root.children, key=lambda child: self.get_augmented_value(child, player))

    def selection(self):
        """
        Tree search - Traversing the tree from the root to a leaf node by using the tree policy.
        :return: Node - the first node on the path that reports no children
        """
        node = self.root
        # Descend for as long as the current node is not a leaf
        while len(node.get_children()) != 0:
            node = self.select(node)
        return node

    def expansion(self, leaf):
        """
        Node Expansion - Generating all child states of a parent state, and then connecting the tree node
        housing the parent state (a.k.a. parent node) to the nodes housing the child states (a.k.a. child nodes).
        :param leaf: Node - the node to expand; its children attribute is overwritten
        :return: Node - the same leaf that was passed in
        """
        # Get all legal child states from leaf state
        leaf.children = self.state_manager.get_child_nodes(leaf.state)

        # Every child belongs to the player following the leaf's player and points back at the leaf
        child_player = get_next_player(leaf.player)
        for child in leaf.children:
            child.player = child_player
            child.parent = leaf
        # Tree is now expanded, return the leaf, and simulate to game over
        return leaf

    def simulation(self, node):
        """
        Leaf Evaluation - Estimating the value of a leaf node in the tree by doing a roll-out simulation using the
        default policy (uniformly random child) from the leaf node's state to a final state.
        The nodes visited during the roll-out are not attached to the tree.
        :param node: Node - the node to start the roll-out from
        :return: int - 1 if player 1 won the simulated game, else 0
        """
        current_node = node
        player = node.player
        children = self.state_manager.get_child_nodes(current_node.state)
        while len(children) != 0:
            # Use the default policy (random) to select a child
            current_node = random.choice(children)
            player = get_next_player(player)
            children = self.state_manager.get_child_nodes(current_node.state)
        # The player to move in the final state has no moves left, so the winner is the
        # player who made the last move
        winner = get_next_player(player)
        return int(winner == 1)

    @staticmethod
    def backward(sim_node, z):
        """
        Backward propagation - Passing the evaluation of a final state back up the tree. Every node on the
        path from sim_node to the root gets its visit count incremented; every node on that path except
        the root (which has no parent) also gets its value moved towards z as a running average.
        :param sim_node: Node - leaf node to go backward from
        :param z: int - 1 if player 1 won, else 0
        :return: None
        """
        node = sim_node
        node.total += 1
        # Compare against None explicitly so the walk does not depend on Node truthiness
        while node.parent is not None:
            node.parent.total += 1
            # Incremental mean: node.total was already incremented for this visit
            node.value += (z - node.value) / node.total
            node = node.parent

    def select_actual_action(self, player):
        """
        To select the actual action to take in the game, pick the child of the root with the best value:
        the highest value for player 1, the lowest for any other player. No exploration bonus is applied.
        On ties the first child wins. Raises ValueError when the root has no children.
        :param player: int - the player about to move
        :return: Node - the chosen child of the root
        """
        # Maximise for P1 and minimise for P2
        pick = max if player == 1 else min
        return pick(self.root.children, key=operator.attrgetter("value"))

    def tree_print(self):
        """
        Print (total, player) for every node in the tree in breadth-first order, one node per line.
        Prints nothing when no root has been set.
        :return: None
        """
        if self.root is None:
            return
        # Walk the tree one level at a time; this keeps breadth-first order without
        # re-copying a queue on every step
        level = [self.root]
        while level:
            next_level = []
            for node in level:
                print((node.total, node.player))
                next_level.extend(node.children)
            level = next_level