Example #1
def update():
    for episode in range(Max_Episodes):
        # Initial observation
        observation = env.reset()
        
        while True:
            # Fresh env
            env.render()
            # RL chooses an action
            action = RL.choose_action(str(observation))
            # RL takes the action and gets the next observation and reward
            observation_, reward, done = env.step(action)
            # RL learns from the transition (S, A, R, S')
            RL.learn(str(observation), action, reward, str(observation_))
            # Swap observation
            observation = observation_

            if done:
                break
        
    print('game over')
    env.destroy()

if __name__ == "__main__":
    env = Maze()
    RL = QLearningTable(actions = list(range(env.n_actions)))
    
    env.after(100, update)
    env.mainloop()
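The examples on this page all drive an agent through the same two calls, choose_action(state) and learn(s, a, r, s_), but the table-based agent itself is not shown. Below is a minimal sketch of such a QLearningTable class: a pandas-backed Q-table with an epsilon-greedy policy and the standard Q-learning update. Names, defaults, and the 'terminal' convention are illustrative assumptions, not the project's actual RL_brain code.

# Minimal sketch of a tabular Q-learning agent (illustrative, not the project's own class).
import numpy as np
import pandas as pd


class QLearningTable:
    def __init__(self, actions, learning_rate=0.01, reward_decay=0.9, e_greedy=0.9):
        self.actions = actions                      # list of action indices
        self.lr = learning_rate
        self.gamma = reward_decay
        self.epsilon = e_greedy                     # probability of acting greedily
        self.q_table = pd.DataFrame(columns=self.actions, dtype=np.float64)

    def check_state_exist(self, state):
        # add an all-zero row the first time a state is seen
        if state not in self.q_table.index:
            self.q_table.loc[state] = [0.0] * len(self.actions)

    def choose_action(self, observation):
        self.check_state_exist(observation)
        if np.random.uniform() < self.epsilon:
            state_action = self.q_table.loc[observation, :]
            # break ties among equally valued actions at random
            action = np.random.choice(state_action[state_action == state_action.max()].index)
        else:
            action = np.random.choice(self.actions)
        return action

    def learn(self, s, a, r, s_):
        self.check_state_exist(s_)
        q_predict = self.q_table.loc[s, a]
        # assumption: the env returns the string 'terminal' as s_ when the episode ends
        if s_ != 'terminal':
            q_target = r + self.gamma * self.q_table.loc[s_, :].max()  # Q-learning target
        else:
            q_target = r                                               # episode ended
        self.q_table.loc[s, a] += self.lr * (q_target - q_predict)     # update Q(s, a)

With this interface the update() loop above runs unchanged: states are passed in as strings, so any hashable state representation can serve as a row key in the table.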
Example #2
                RL.learn()

            # swap observation
            observation = observation_

            # break while loop when end of this episode
            if done:
                break
            step += 1

    # end of game
    print('game over')
    env.destroy()


if __name__ == "__main__":
    # maze game
    env = Maze()
    RL = DeepQNetwork(
        env.n_actions,
        env.n_features,
        learning_rate=0.01,
        reward_decay=0.9,
        e_greedy=0.9,
        replace_target_iter=200,
        memory_size=2000,
        # output_graph=True
    )
    env.after(100, run_maze)
    env.mainloop()
    RL.plot_cost()
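In this DQN variant the constructor arguments hint at the agent's internals: memory_size=2000 is presumably the replay memory that RL.learn() samples from, replace_target_iter=200 how often the target network is synced, and e_greedy the probability of taking the greedy action. A minimal sketch of the replay-memory part alone follows (a hypothetical helper, not the project's DeepQNetwork code), assuming each state is a flat feature vector of length n_features.

# Minimal replay-memory sketch (hypothetical helper, not the project's DeepQNetwork internals).
import numpy as np


class ReplayMemory:
    def __init__(self, memory_size, n_features):
        # each row stores one transition: [s, a, r, s_]
        self.memory = np.zeros((memory_size, n_features * 2 + 2))
        self.memory_size = memory_size
        self.counter = 0

    def store_transition(self, s, a, r, s_):
        transition = np.hstack((s, [a, r], s_))
        index = self.counter % self.memory_size    # overwrite the oldest entries first
        self.memory[index, :] = transition
        self.counter += 1

    def sample(self, batch_size):
        # sample uniformly from the filled part of the buffer
        upper = min(self.counter, self.memory_size)
        indices = np.random.choice(upper, size=batch_size)
        return self.memory[indices, :]

In a typical DQN learn() step, a batch sampled this way is split back into its (s, a, r, s_) columns, and every replace_target_iter learning steps the target network's weights are copied from the evaluation network.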
Example #3
File: main.py Project: msdnqqy/RL
            action = rl.choose_action(state_str, avaliable_actions)  # choose an action
            reward, state_next, is_success = maze.step(action)  # get the reward from the environment

            state_next_str_arr = np.array(state_next) / maze.unit

            state_next_str = str(state_next_str_arr.tolist())

            rl.update(state_str, action, state_next_str, reward, is_success,
                      steps)  # update the state
            steps.append([state_str, action])  # store the experience for later learning
            maze.render()
            maze.write_weight(rl.state_table)

        print('run end {0}'.format(j))
        print(rl.state_table.round(2))
        time.sleep(0.5)

        # maze.write_weight(rl.state_table)
        # force update: update the weights along the whole path; after many training runs this yields good weights
        # rl.forceUpdate(steps,reward/10)
        print("forceUpdate")
        # print(rl.state_table.round(2))


if __name__ == '__main__':
    maze = Maze(8, 6, chif=15)
    rl = RLbrain(maze.get_all_action())  #获取所有动作
    maze.after(100, render)
    maze.mainloop()
Example #4
    for episode in range(100):
        # initial observation
        s_curr = maze._reset_maze()

        while True:
            maze._render()

            # Get next action from the Q-table
            action = rl.select_next_action(str(s_curr))

            # take the action and observe the next state and reward
            s_next, reward, isDone = maze._update_maze(action)

            # learn from the feedback
            rl.learn(str(s_curr), action, reward, str(s_next))

            s_curr = s_next
            if isDone:
                break

    print("Game over")
    maze.destroy()


if __name__ == "__main__":
    maze = Maze()
    rl = QLearningTable(actions=list(range(len(maze.action_space))))

    maze.after(100, update)
    maze.mainloop()
Example #5
        s = env.reset()
        while True:
            env.render()
            a = RL.choose_action(str(s))
            s_, r, done = env.step(a)
            RL.learn(str(s), a, r, str(s_))

            # use a model to output (r, s_) by inputting (s, a)
            # the model in dyna Q version is just like a memory replay buffer
            env_model.store_transition(str(s), a, r, s_)
            for n in range(10):  # learn 10 more times using the env_model
                ms, ma = env_model.sample_s_a()  # ms in here is a str
                mr, ms_ = env_model.get_r_s_(ms, ma)
                RL.learn(ms, ma, mr, str(ms_))

            s = s_
            if done:
                break

    # end of game
    print('game over')
    env.destroy()


if __name__ == "__main__":
    env = Maze()
    RL = QLearningTable(actions=list(range(env.n_actions)))
    env_model = EnvModel(actions=list(range(env.n_actions)))

    env.after(0, update)
    env.mainloop()
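The Dyna-Q example uses each real transition once for direct Q-learning and then replays it through env_model for ten planning updates. Only the calls (store_transition, sample_s_a, get_r_s_) are shown above; here is a minimal sketch of a dictionary-backed model with that interface (illustrative, not the project's EnvModel class).

# Minimal sketch of a Dyna-Q environment model (illustrative, not the project's EnvModel class).
import random


class EnvModel:
    """Deterministic tabular model: remembers the last (r, s_) seen for each (s, a)."""

    def __init__(self, actions):
        self.actions = actions
        self.database = {}                     # (s, a) -> (r, s_)

    def store_transition(self, s, a, r, s_):
        self.database[(s, a)] = (r, s_)

    def sample_s_a(self):
        # pick a previously visited state-action pair at random
        s, a = random.choice(list(self.database.keys()))
        return s, a

    def get_r_s_(self, s, a):
        # return the stored reward and next state for that pair
        r, s_ = self.database[(s, a)]
        return r, s_

Keeping only the most recent outcome per (s, a) pair is enough for a deterministic maze, which is why the comment above likens the model to a replay buffer; a stochastic environment would instead need to store a distribution of outcomes per pair.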
Example #6
        observation = env.reset()
        while True:
            # Fresh env
            env.render()
            # RL chooses an action
            action = RL.choose_action(str(observation))
            # RL takes the action and gets the next observation and reward
            observation_, reward, done = env.step(action)
            # RL learns from the transition (S, A, R, S')
            RL.learn(str(observation), action, reward, str(observation_))
            # Swap observation
            observation = observation_
            if done:
                break
    print('game over')
    env.destroy()


if __name__ == "__main__":
    env = Maze()
    if Algorithm == 'SarsaLambda':
        RL = SarsaLambda(action_space=list(range(env.n_actions)))
        env.after(100, update_Sarsa)
    elif Algorithm == 'Q_learning':
        RL = Q_learning(action_space=list(range(env.n_actions)))
        env.after(100, update)
    elif Algorithm == 'Sarsa':
        RL = Sarsa(action_space=list(range(env.n_actions)))
        env.after(100, update_Sarsa)
    env.mainloop()
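Example #6 selects between Q-learning, Sarsa and Sarsa(lambda), and routes the Sarsa variants to a separate update_Sarsa loop because Sarsa must choose the next action before it can learn. The difference lies only in the learning target; below is a minimal sketch of the two update rules on a plain-dict Q-table (illustrative, not the project's classes).

# Minimal sketch of the Q-learning vs. Sarsa targets (illustrative, not the project's classes).
# Note: at a terminal next state the bootstrap term is dropped and the target is just r.
from collections import defaultdict

GAMMA = 0.9      # reward decay
LR = 0.01        # learning rate
N_ACTIONS = 4

Q = defaultdict(lambda: [0.0] * N_ACTIONS)   # Q[state][action]


def q_learning_update(s, a, r, s_):
    # off-policy: bootstrap from the best next action, regardless of what is actually taken
    target = r + GAMMA * max(Q[s_])
    Q[s][a] += LR * (target - Q[s][a])


def sarsa_update(s, a, r, s_, a_):
    # on-policy: bootstrap from the action a_ the agent has already chosen for s_
    target = r + GAMMA * Q[s_][a_]
    Q[s][a] += LR * (target - Q[s][a])

This is why a typical update_Sarsa loop chooses the next action right after env.step() and passes it into learn(), while the Q-learning loop shown above can learn immediately from (s, a, r, s_). Sarsa(lambda) additionally keeps an eligibility trace so each update also propagates back along recently visited state-action pairs.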