```python
import tensorflow as tf

# n_features, n_actions, lr_actor, lr_critic, MAX_EPISODE,
# MAX_EP_STEPS and env are assumed to be defined earlier
sess = tf.Session()
actor = Actor(sess, n_features=n_features, n_actions=n_actions, lr=lr_actor)
critic = Critic(sess, n_features=n_features, lr=lr_critic)
sess.run(tf.global_variables_initializer())

for i_episode in range(MAX_EPISODE):
    state = env.reset()
    step = 0
    track_r = []
    while True:
        action = actor.choose_action(state)
        # gym-style API: step returns (next_state, reward, done, info)
        next_state, reward, done, _ = env.step(action)
        env.render()
        track_r.append(reward)

        # the critic evaluates the transition and returns the TD error,
        # which the actor then uses as its policy-gradient weight
        td_error = critic.learn(state, reward, next_state)
        actor.learn(state, action, td_error)

        state = next_state
        step += 1

        if done or step >= MAX_EP_STEPS:
            ep_rs_sum = sum(track_r)
            # exponentially smoothed running reward for logging
            if 'running_reward' not in globals():
                running_reward = ep_rs_sum
            else:
                running_reward = running_reward * 0.95 + ep_rs_sum * 0.05
            print("episode:", i_episode, "step:", step,
                  " reward:", int(running_reward))
            break
```
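The `Actor` and `Critic` classes themselves are not shown in this excerpt. The sketch below is one plausible TensorFlow 1.x implementation that matches the calls made above (`choose_action` and the two `learn` methods); the single 20-unit hidden layer and the discount factor `gamma=0.9` are illustrative assumptions, not taken from the source. The critic fits V(s) by minimizing the squared TD error and returns that error, which the actor uses to weight the log-probability of the action it took.

```python
import numpy as np
import tensorflow as tf

class Actor(object):
    """Policy network: maps a state to a distribution over actions."""
    def __init__(self, sess, n_features, n_actions, lr=0.001):
        self.sess = sess
        self.s = tf.placeholder(tf.float32, [1, n_features], "state")
        self.a = tf.placeholder(tf.int32, None, "act")
        self.td_error = tf.placeholder(tf.float32, None, "td_error")

        l1 = tf.layers.dense(self.s, 20, tf.nn.relu)  # hidden size is an assumption
        self.acts_prob = tf.layers.dense(l1, n_actions, tf.nn.softmax)

        # policy-gradient objective: log pi(a|s) weighted by the TD error
        log_prob = tf.log(self.acts_prob[0, self.a])
        self.exp_v = tf.reduce_mean(log_prob * self.td_error)
        self.train_op = tf.train.AdamOptimizer(lr).minimize(-self.exp_v)

    def choose_action(self, s):
        probs = self.sess.run(self.acts_prob, {self.s: s[np.newaxis, :]})
        return np.random.choice(np.arange(probs.shape[1]), p=probs.ravel())

    def learn(self, s, a, td):
        feed = {self.s: s[np.newaxis, :], self.a: a, self.td_error: td}
        self.sess.run(self.train_op, feed)


class Critic(object):
    """Value network: estimates V(s) and computes the TD error."""
    def __init__(self, sess, n_features, lr=0.01, gamma=0.9):
        self.sess = sess
        self.gamma = gamma
        self.s = tf.placeholder(tf.float32, [1, n_features], "state")
        self.v_next = tf.placeholder(tf.float32, [1, 1], "v_next")
        self.r = tf.placeholder(tf.float32, None, "reward")

        l1 = tf.layers.dense(self.s, 20, tf.nn.relu)
        self.v = tf.layers.dense(l1, 1)

        # TD error: r + gamma * V(s') - V(s)
        self.td_error = self.r + self.gamma * self.v_next - self.v
        self.loss = tf.square(self.td_error)
        self.train_op = tf.train.AdamOptimizer(lr).minimize(self.loss)

    def learn(self, s, r, s_):
        s, s_ = s[np.newaxis, :], s_[np.newaxis, :]
        v_next = self.sess.run(self.v, {self.s: s_})
        td_error, _ = self.sess.run([self.td_error, self.train_op],
                                    {self.s: s, self.v_next: v_next, self.r: r})
        return td_error
```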
```python
grid_world.create_grid_ui(grid_world.m, grid_world.n,
                          (grid_world.start_x, grid_world.start_y),
                          (grid_world.end_x, grid_world.end_y),
                          grid_world.obstacles)
agent = SARSAgent(actions=list(range(grid_world.action_size)))

number_of_episodes = 10
for episode in range(number_of_episodes):
    # reset the environment and get the initial state
    state = grid_world.reset()
    # choose the first action from the agent's policy
    action = agent.get_action(str(state))

    while True:
        grid_world.render()

        # take the action and proceed one step in the environment
        next_state, reward, done = grid_world.step(action)
        # SARSA is on-policy: the next action is chosen before learning
        next_action = agent.get_action(str(next_state))

        # with the sample <s, a, r, s', a'>, the agent updates its q function
        agent.learn(str(state), action, reward, str(next_state), next_action)

        state = next_state
        action = next_action

        # print the q function of all states on screen
        # grid_world.print_value_all(agent.q_table)

        if done:
            break
```
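`SARSAgent` is likewise not defined here. A minimal tabular version consistent with the loop above might look like the following, assuming an epsilon-greedy policy; the hyperparameters (learning rate 0.01, discount 0.9, epsilon 0.1) are illustrative defaults, not taken from the source. The key line is the on-policy SARSA update, which bootstraps from the action the agent will actually take next rather than from the greedy maximum.

```python
import random
from collections import defaultdict

import numpy as np

class SARSAgent:
    """Tabular on-policy SARSA agent with an epsilon-greedy policy."""
    def __init__(self, actions, lr=0.01, gamma=0.9, epsilon=0.1):
        self.actions = actions
        self.lr = lr
        self.gamma = gamma
        self.epsilon = epsilon
        # default Q-value of 0.0 for every (state, action) pair
        self.q_table = defaultdict(lambda: [0.0] * len(actions))

    def get_action(self, state):
        # explore with probability epsilon, otherwise act greedily
        if np.random.rand() < self.epsilon:
            return random.choice(self.actions)
        q_values = self.q_table[state]
        max_q = max(q_values)
        # break ties between equally good actions at random
        best = [a for a, q in enumerate(q_values) if q == max_q]
        return random.choice(best)

    def learn(self, state, action, reward, next_state, next_action):
        # SARSA update: Q(s,a) <- Q(s,a) + lr * [r + gamma * Q(s',a') - Q(s,a)]
        current_q = self.q_table[state][action]
        next_q = self.q_table[next_state][next_action]
        self.q_table[state][action] = current_q + self.lr * (
            reward + self.gamma * next_q - current_q)
```

Because the update uses Q(s', a') for the action actually selected, exploration directly shapes the learned values; this is what distinguishes SARSA from Q-learning, which would bootstrap from max Q(s', a) instead.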