Python Actor.build_net Examples

Programming Language: Python

Namespace/Package Name: Actor

Class/Type: Actor

Method/Function: build_net

Examples at hotexamples.com: 2

Python Actor.build_net - 2 examples found. These are the top-rated real-world Python examples of Actor.Actor.build_net extracted from open source projects. You can rate examples to help us improve their quality.

Frequently Used Methods

Show Hide

Actor(30)

__init__(15)

train(15)

parameters(14)

choose_action(8)

learn(8)

predict(7)

train_fn(6)

eval(6)

state_dict(5)

load_state_dict(4)

load(4)

_loss_(3)

update(3)

setPos(2)

ChooseActionByPolicy(2)

save(2)

setcollaabb(2)

sethitaabb(2)

get_shortest_actor(2)

model(2)

build_net(2)

doAttack(1)

target_predict(1)

save_cache(1)

setLocation(1)

addtriumphs(1)

setUnqTags(1)

set_brain(1)

set_goal(1)

setaabb(1)

addedToWorld(1)

add_grad_to_graph(1)

addMovie(1)

stop(1)

take_damage_shortest_point(1)

target_actions(1)

target_predict_method(1)

run(1)

transfer_to_actor_model(1)

update_target(1)

update_actor_target(1)

updatePolicy(1)

act(1)

unpickleActors(1)

triumph(1)

train_p(1)

target_update_method(1)

action(1)

train_2(1)

Example #1

Show file

File: Actor_critic_tsf_config.py Project: liulu112601/Deep-Learning-First-Taste

def run():
    """Train an actor-critic pair on the MountainCar-v0 gym environment.

    Creates the environment, a TensorFlow session, and one Actor and one
    Critic, builds both networks, and then runs ``n_episodes`` episodes.
    Each step asks the actor for the next action, lets the critic compute
    a TD error, and updates the actor with it.

    Relies on names defined outside this function: ``gym``, ``tf``, ``np``,
    ``Actor``, ``Critic``, ``n_actions``, ``n_features``, ``lr_actor``,
    ``lr_critic`` and ``n_episodes``.

    Returns:
        None. Progress is reported via ``print``.
    """
    # build environment using openai gym
    env = gym.make('MountainCar-v0')
    # presumably unwrapped to drop gym's episode step limit -- TODO confirm
    env = env.unwrapped
    sess = tf.Session()
    try:
        # create an actor and critic
        actor = Actor(sess, n_actions=n_actions, n_features=n_features, lr=lr_actor)
        critic = Critic(sess, n_features=n_features, lr=lr_critic)
        # build the two networks
        actor.build_net()
        critic.build_net()

        sess.run(tf.global_variables_initializer())

        # count steps across all episodes (not reset per episode)
        step = 0
        for episode in range(n_episodes):
            # s returned by gym is a vector, we need to transform it into a matrix
            s = env.reset()[np.newaxis, :]
            a = actor.choose_action(s)
            # call env.render() here (and inside the loop) to watch training;
            # leaving it out speeds things up
            while True:
                step += 1
                # a new transition
                # NOTE(review): the reward `r` is never passed to critic.learn;
                # confirm that Critic obtains the reward some other way.
                s_, r, done, _ = env.step(a)
                # add a leading axis so s_ has the same rank as s
                s_ = s_[np.newaxis, :]
                a_ = actor.choose_action(s_)
                # calculate td_error
                td_error = critic.learn(s, s_)
                actor.learn(s, a, td_error)
                # Advance BOTH state and action. Without `a = a_` the action
                # chosen at reset would be replayed for the whole episode.
                s = s_
                a = a_

                if step % 500 == 0:
                    print(step, s_)

                if done:
                    print('arrive')
                    print(s_)
                    break
    finally:
        # release the session's resources even if training raises
        sess.close()

Example #2

Show file

File: Actor_critic_tsf.py Project: liulu112601/Deep-Learning-First-Taste

# Size of the observation vector passed to Actor and Critic
# (position and velocity).
n_features = 2
# Number of discrete actions passed to the Actor (0, 1, 2).
n_actions = 3
# Number of episodes the training loop below iterates over.
n_episode = 1000

if __name__ == '__main__':
    #build environment using openai gym
    env = gym.make('MountainCar-v0')
    env = env.unwrapped
    sess = tf.Session()
    #create an actor and critic
    actor = Actor(sess,n_actions=n_actions,n_features=n_features,lr=lr_actor)
    critic = Critic(sess,n_features=n_features,lr=lr_critic)
    #build the two networks
    actor.build_net()
    critic.build_net()

    sess.run(tf.global_variables_initializer())

    #tf.summary.FileWriter("",sess.graph)
    #count steps
    step = 0
    #env.render()
    for episode in range(n_episode):
        s = env.reset()
        #comment the render() to speed up
        #env.render()
        #s returned by gym is a vector, we need to transform it into a matrix
        s = s[np.newaxis, :]
        a = actor.choose_action(s)