def doAction(self, chaser: "Agent", target: "Agent", grid: "GridMap", state: "State"):
    """Choose and execute one epsilon-greedy action for the target, then
    apply a Q-learning update based on a simulated next state.

    Args:
        chaser: the pursuing agent (used to build the state and to
            predict its next move).
        target: the evading agent this policy controls; moved in place
            via target.Walk(action).
        grid:   the map, used for movability checks.
        state:  state helper providing getState / canMoveDirection /
            nextDirection.

    Side effects: appends to self.st and self.act, moves `target`, and
    updates one entry of self.q.
    """
    # Record the current state s = (relative position encoding, 3 indices).
    now_st = state.getState(chaser, target)
    self.st.append(now_st)

    # --- Action selection -------------------------------------------------
    # Explore with probability epsilon, or when this state's Q row is all
    # zeros (no information learned yet); otherwise act greedily over the
    # movable directions.
    action = -1
    p = random.random()
    if p < epsilon or (not np.any(self.q[now_st[0]][now_st[1]][now_st[2]])):
        while True:
            action = random.randint(0, 3)
            if state.canMoveDirection(target, grid, action):
                break
    else:
        max_q = -100000000
        for i in range(4):
            if max_q < self.q[now_st[0]][now_st[1]][now_st[2]][i] and state.canMoveDirection(target, grid, i):
                max_q = self.q[now_st[0]][now_st[1]][now_st[2]][i]
                action = i

    # Execute and record the chosen action.
    target.Walk(action)
    self.act.append(action)

    # --- Predict the next state on deep copies ----------------------------
    # Deep copies keep the real agents/state untouched while simulating.
    # NOTE(review): `target` has already taken `action` above, so
    # tmp_target.Walk(action) applies the same action a second time —
    # presumably a one-step look-ahead of the target; confirm intent.
    tmp_chaser = copy.deepcopy(chaser)
    tmp_target = copy.deepcopy(target)
    tmp_state = copy.deepcopy(state)
    tmp_target.Walk(action)
    tmp_chaser.Walk(tmp_state.nextDirection(chaser, target, grid))
    next_st = state.getState(tmp_chaser, tmp_target)

    # --- Estimate max_a' Q(s', a') with the same epsilon-greedy scheme ----
    # NOTE(review): this branch checks movability with grid.canMove(...)
    # while the selection above uses state.canMoveDirection(...) —
    # presumably equivalent; verify against the rest of the project.
    nextMax_q = -100000000
    p = random.random()
    if p < epsilon or (not np.any(self.q[next_st[0]][next_st[1]][next_st[2]])):
        while True:
            next_action = random.randint(0, 3)
            if state.canMoveDirection(target, grid, next_action):
                # BUGFIX: was `nextMax_q = nextMax_q = ...` (duplicated
                # assignment); same behavior, cleaned up.
                nextMax_q = self.q[next_st[0]][next_st[1]][next_st[2]][next_action]
                break
    else:
        for i in range(4):
            if nextMax_q < self.q[next_st[0]][next_st[1]][next_st[2]][i] and grid.canMove(next_st[0] + dx[i], next_st[1] + dy[i]):
                nextMax_q = self.q[next_st[0]][next_st[1]][next_st[2]][i]
        # BUGFIX: if no direction was movable the -100000000 sentinel
        # leaked into the update below and poisoned Q(s, a); treat a
        # dead-end next state as having zero future value instead.
        if nextMax_q == -100000000:
            nextMax_q = 0

    # --- Q-learning update ------------------------------------------------
    # Q(s,a) <- (1-alpha)*Q(s,a) + alpha*(r + ganma * max_a' Q(s',a'))
    self.q[now_st[0]][now_st[1]][now_st[2]][action] = (
        (1 - alpha) * self.q[now_st[0]][now_st[1]][now_st[2]][action]
        + alpha * (self.getReward(tmp_chaser, tmp_target, tmp_state) + ganma * nextMax_q)
    )
def greedy_doAction(self, chaser: "Agent", target: "Agent", grid: "GridMap", state: "State"):
    """Move the target one step using the purely greedy (no exploration) policy.

    Picks the movable direction with the highest Q-value for the current
    state and executes it via target.Walk. On strict ties the lowest
    direction index wins; if no direction is movable, direction 0 is used.
    """
    now = state.getState(chaser, target)
    q_row = self.q[now[0]][now[1]][now[2]]
    best_action = 0
    best_q = -100000000
    for direction in range(4):
        if not state.canMoveDirection(target, grid, direction):
            continue
        if q_row[direction] > best_q:
            best_q = q_row[direction]
            best_action = direction
    target.Walk(best_action)
def doAction(self, chaser: "Agent", target: "Agent", grid: "GridMap", state: "State"):
    """Epsilon-greedy step for the target (no learning update here).

    Records the current state in self.st, picks an action — random when
    exploring (probability epsilon, or when this state's Q row is all
    zeros), greedy over movable directions otherwise — then executes it
    via target.Walk and records it in self.act.
    """
    # Record the current state.
    now = state.getState(chaser, target)
    self.st.append(now)

    q_row = self.q[now[0]][now[1]][now[2]]
    if random.random() < epsilon or not np.any(q_row):
        # Explore: keep drawing until a movable direction comes up.
        chosen = random.randint(0, 3)
        while not state.canMoveDirection(target, grid, chosen):
            chosen = random.randint(0, 3)
    else:
        # Exploit: movable direction with the highest Q-value.
        chosen = -1
        best = -100000000
        for direction in range(4):
            if state.canMoveDirection(target, grid, direction) and q_row[direction] > best:
                best = q_row[direction]
                chosen = direction

    # Execute and record the action.
    target.Walk(chosen)
    self.act.append(chosen)
def chaseTarget(self, chaser: "Agent", target: "Agent", grid: "GridMap", state: "State"):
    """Advance the chaser one step toward the target.

    The direction comes from state.nextDirection (the pathing helper);
    the chaser is moved in place via chaser.Walk.
    """
    chaser.Walk(state.nextDirection(chaser, target, grid))