Exemplo n.º 1
0
    sys.path.append('..')

from game import Game
from game import GameEnv
import numpy as np
from utils import dump
import os
import shutil

path = 'train'

for cnt in range(30):
    env = GameEnv()
    games = [Game(env, player) for player in range(3)]
    datas = [[env.hand_cards(), None, None] for _ in range(3)]
    while not env.game_over():
        period = env.period()
        if period != 3:
            curr_player = env.curr_player()
            game = games[curr_player]
            action = np.random.choice(game.action_list())
            for game in games:
                game.move(action)
            env.move(action)
        else:
            for player, game in enumerate(games):
                response = env.response(player)
                game.move(response)
            env.move(-1)
    for data, game in zip(datas, games):
        data[1] = game.policy()
Exemplo n.º 2
0
def match(AIs):
    def read(popen):
        while True:
            output = popen.stdout.readline()
            if output is not None:
                return output.decode('utf-8')

    def write(popen, obj):
        if popen == AIs[args.p]:
            return
        popen.stdin.write((str(obj) + '\n').encode('utf-8'))
        popen.stdin.flush()

    (name0, simulation0), (name1, simulation1), (name2,
                                                 simulation2) = players_attr
    write(AIs[0], name0)
    write(AIs[0], simulation0)

    write(AIs[1], name1)
    write(AIs[1], simulation1)

    write(AIs[2], name2)
    write(AIs[2], simulation2)

    env = GameEnv()
    hand_cards = env.hand_cards()

    data.append(env.hand_cards())
    game = Game(env, args.p)

    for player in range(3):
        write(AIs[player], list(hand_cards.flatten()))
    slot = []
    ig = False

    print('Filename:', filename)
    print('Your position:', args.p)
    print('Your hand cards:', to_chars(hand_cards[args.p]))

    while not env.game_over():
        period = env.period()
        player = env.curr_player()
        if period == 1 and player == args.p:
            print('Your position:', args.p)
            print('Your hand cards:', to_chars(env.hand_cards()[args.p]))
            print('Hand cards num of 3 players:', env.hand_cards_num())
            print('-----')
        if period == 1 or period == 2:
            if player == args.p:
                if period == 1:
                    _game = game.copy()
                    print('Your turn:', end=' ')
                    chars = input()
                    try:
                        if chars == 'pass':
                            actions = [0]
                        else:
                            chars = chars.upper().rstrip().replace(
                                ',', '').split(' ')
                            while '' in chars:
                                chars.remove('')
                            # for char in chars:
                            # 	if char not in card_dict:
                            # 		raise KeyError('input error')
                            actions = to_action(chars)
                        for action in actions:
                            if action in _game.action_list():
                                _game.move(action)
                            else:
                                raise RuntimeError('couldn\'t move')
                    except (RuntimeError, KeyError):
                        print('Invalid action! Please retry.')
                        print('=====')
                        continue
                    game = _game

                    for action in actions:
                        env.move(action)
                        for target in range(3):
                            write(AIs[target], action)
                    print('=====')
                if period == 2:
                    print('Your bet:', end=' ')
                    action = int(input()) + 352
                    if action not in game.action_list():
                        print('Invalid action! Please retry.')
                        continue
                    env.move(action)
                    game.move(action)
                    for target in range(3):
                        write(AIs[target], action)
            else:
                action = int(read(AIs[player]))
                # print(action)
                env.move(action)
                game.move(action)
                for target in range(3):
                    if target != player:
                        write(AIs[target], action)
                if period == 1:
                    slot += to_chars(Action(action).to_array()).replace(
                        '[', '').replace(']', '').replace(',', '').split(' ')
                    if env.curr_player() != player:
                        if action == 0:
                            print('Player%d pass' % player)
                        else:
                            print('Player%d\'s turn:' % player,
                                  str(slot).replace('\'', ''))
                        print('=====')
                        slot = []
                if period == 2:
                    print('Player%d\'s bet: %d' % (player, action - 352))
            if period == 2 and env.period() == 3:
                print('Landlord is Player%d' % env.lord_player())
                print('Bottom cards:', to_chars(env.bottom()))
                print('===== Game Start =====')
        if period == 3:
            for player in range(3):
                write(AIs[player], env.response(player))
            game.move(env.response(args.p))
            env.move(-1)
    evals = [None, None, None]
    for player in range(3):
        if player != args.p:
            evals[player] = (float(read(AIs[player])) + 1) / 2
            AIs[player].terminate()
    # print(evals)
    data.append(game.policy())
    with open('human/%s.pkl' % filename, 'wb') as f:
        pickle.dump(data, f)

    if args.p == env.lord_player():
        is_winner = env.hand_cards_num()[args.p] == 0
    else:
        is_winner = env.hand_cards_num()[env.lord_player()] != 0
    if game.lord_player() == -1:
        print('<<<<<<<<<<<<<<< DRAW >>>>>>>>>>>>>>>')
    elif is_winner:
        print('<<<<<<<<<<<<<<< YOU WIN >>>>>>>>>>>>>>>')
    else:
        print('<<<<<<<<<<<<<<< YOU LOSE >>>>>>>>>>>>>>>')