Примеры использования Python Env.get_turn

Язык программирования: Python

Пространство имен/Пакет: environment

Класс/Тип: Env

Метод/Функция: get_turn

Примеров на hotexamples.com: 2

Найдено 2 примера использования Python Env.get_turn. Ниже приведены лучшие примеры кода на Python для environment.Env.get_turn, взятые из проектов с открытым исходным кодом. Вы можете оценить каждый пример, чтобы помочь нам улучшить качество подборки.

Основные методы

Показать / Скрыть

Env(30)

step(30)

reset(30)

get_initial_state(7)

render(6)

print_value_all(4)

close(3)

end(3)

plot(3)

save_all_newlines_to_file(2)

take_action(2)

calc_dist(2)

get_turn(2)

get_state(2)

mover(1)

move(1)

DoMove(1)

mostrar_mapa(1)

make(1)

preprocess_img(1)

mainloop(1)

load_sw_set(1)

load_all_doc(1)

is_gameover(1)

plot_goal(1)

print_value_q_all(1)

print_env(1)

print_status(1)

intrinsic_reward(1)

print_values(1)

randomescolha(1)

render_grid(1)

restart_game(1)

rtn_put_available_position(1)

set(1)

set_data_set(1)

setup_logging(1)

tick(1)

toJson(1)

toggle_table(1)

train(1)

inverse(1)

incentive(1)

init_idf(1)

calc_shaped_reward(1)

common_reset(1)

classify(1)

check_win(1)

check_start(1)

check_end(1)

Пример #1

Показать файл

    # Excerpt of a training loop: runs EPISODES episodes against `env` and, on
    # odd turns, lets `player1` pick a move as BLACK and train on the result.
    # `env`, `player1`, `EPISODES`, `BLACK` and `np` are defined outside this
    # excerpt.
    # Counts loop iterations across all episodes (never reset in this excerpt).
    global_step = 0
    # Not used within the visible excerpt.
    scores, episodes = [], []

    for e in range(EPISODES):
        done = False
        # Initialised per episode; not updated within the visible excerpt.
        score = 0
        state = env.reset()
        # Reshape the state into a single row of player1.state_size entries.
        state = np.reshape(state, [1, player1.state_size])

        while not done:
            # Original comment here read "initialize env"; the statement below
            # actually increments the global step counter.
            global_step += 1

            # Odd turn (Q-learning player) - Black
            if env.get_turn() % 2 == 1:
                # Select an action for the current state
                action = player1.get_action(state)
                # Advance the environment one time step with the selected
                # action and collect the resulting sample
                next_state, reward, done = env.step(BLACK, action)
                # Disabled debug output kept as a bare string literal; it has
                # no runtime effect.
                '''
				print("Action : ", action)
				print("Reward : ", reward)
				print("Next State : ", next_state)
				print()
				'''
                next_state = np.reshape(next_state, [1, player1.state_size])
                # The follow-up action is chosen before training and passed to
                # train_model together with the transition.
                # NOTE(review): passing next_action suggests an on-policy
                # (SARSA-style) update, although the comment above calls this
                # a Q-learning player - confirm against train_model.
                next_action = player1.get_action(next_state)
                # Train the model with the sample
                player1.train_model(state, action, reward, next_state,
                                    next_action, done)

Пример #2

Показать файл

                next_state, reward, done = env.step(BLACK, action)
                next_state = np.reshape(next_state, [1, player.state_size])
                if PRINT_FLAG:
                    print("Action : {0} ==> {1}, {2}".format(
                        action, int(action / 10), action % 10))
                    print("Reward : ", reward)
                    print("Next State : ", next_state)
                    print()
                player.append_sample(state, action, reward)
                score += reward
                state = copy.deepcopy(next_state)

                if PRINT_FLAG:
                    # board 출력
                    print("Episode : {0}, Turn : {1}, PLAYER1".format(
                        e, env.get_turn()))
                    env.draw_board()
                    print()
                    time.sleep(1)
            # White
            else:
                # 현재 상태 획득
                state = env.get_state()
                state = np.reshape(state, [1, player.state_size])
                # 현재 상태에 대한 행동 선택
                action = player.get_action(state)
                # 선택한 행동으로 환경에서 한 타임스텝 진행 후 샘플 수집
                next_state, reward, done = env.step(BLACK, action)
                next_state = np.reshape(next_state, [1, player.state_size])
                if PRINT_FLAG:
                    print("Action : {0} ==> {1}, {2}".format(