Python DQNAgent.fill_memory Examples

Programming Language: Python

Namespace/Package Name: dqn

Class/Type: DQNAgent

Method/Function: fill_memory

Examples at hotexamples.com: 1

Python DQNAgent.fill_memory - 1 example found. This is the top-rated real-world Python example of dqn.DQNAgent.fill_memory extracted from open source projects. You can rate examples to help us improve the quality of examples.

Frequently Used Methods

Show Hide

DQNAgent(30)

act(13)

load(11)

compile(8)

fit(5)

save(5)

train(5)

replay(5)

test(4)

save_weights(4)

remember(4)

get_action(4)

load_model(4)

actDeterministically(4)

epsilon(3)

save_model(3)

load_weights(3)

target_model(2)

observe(2)

start(2)

get_last_observations(2)

end(2)

train_one_episode(1)

train_model(1)

trainAgent(1)

train_only(1)

update_epoch(1)

update_replay_memory(1)

test_one_episode(1)

test_model(1)

update_target(1)

store_transition(1)

train_rnn(1)

testAgent(1)

update_target_model(1)

train_vae(1)

training(1)

restart_epoch(1)

store_experience(1)

load_state_dict(1)

__init__(1)

act_2(1)

append_sample(1)

backword(1)

fill_memory(1)

get_test_loss(1)

learn(1)

loss(1)

step(1)

parameters(1)

Example #1

Show file

def main():
    """Build a DQNAgent and alternate between filling its memory and training.

    The agent is configured with the environment id 'Breakout-v0', a CNN
    (passed as ``cnn``), a ``Memory`` of 2000 entries and a ``Preprocessor``.
    One initial ``fill_memory(2000, is_random=True)`` pass is followed by 100
    rounds of ``memory.clear()`` / ``fill_memory(300, is_random=False)``, each
    followed by ``train_vae()`` and ``train_rnn()``.

    Whatever ``fill_memory`` returns is appended, one ``str()`` per line, to
    ``results.txt`` (which is truncated at start-up and begins with the line
    ``Start!``) and accumulated in the list ``S``, which is printed after
    every round.
    """
    results_path = 'results.txt'

    z_size = 128
    batch_size = 32
    learning_rate = 0.0001
    vae = CNN(z_size=z_size,
              batch_size=batch_size,
              learning_rate=learning_rate,
              is_training=True,
              reuse=False,
              gpu_mode=False)

    env = 'Breakout-v0'
    done_reward = -1
    gamma = 0.95
    epsilon = 0.05
    save_freq = 10000
    memory_size = 2000
    rnn = None  # placeholder; not passed to the agent in this function
    controller = None
    memory = Memory(memory_size)
    preprocessor = Preprocessor()
    foresee_steps = 1

    DQA = DQNAgent(env=env,
                   done_reward=done_reward,
                   gamma=gamma,
                   epsilon=epsilon,
                   save_freq=save_freq,
                   batch_size=batch_size,
                   memory=memory,
                   cnn=vae,
                   controller=controller,
                   preprocessor=preprocessor,
                   foresee_steps=foresee_steps,
                   # vae_path = 'tf_cnn/cnn.json',
                   # rnn_path = 'tf_rnn/rnn.json',
                   )

    # Disabled diagnostics kept from the original for reference:
    #     tmp_reward = []
    #     for _ in range(10):
    #         _, reward = DQA.generate_path(is_random = False)
    #         tmp_reward.append(reward)
    #     print(np.mean(tmp_reward))
    #
    #     path, _ = DQA.generate_path(is_random = False)
    #     DQA.test_vae(path)
    #     #DQA.test_rnn(path)
    #     #DQA.test_preprocess(path)

    # Each write uses its own short-lived `with` block so the file handle is
    # never held open across the long-running collection/training calls and
    # is always closed (and flushed) even if one of those calls raises.
    with open(results_path, 'w') as o:
        o.write('Start!\n')

    S = []

    # Initial pass: fill the memory with random play, then train both models.
    res = DQA.fill_memory(2000, is_random=True)
    S.append(res)
    # Persist the result before training so it survives a training failure.
    with open(results_path, 'a') as o:
        o.write(str(res) + '\n')
    DQA.train_vae()
    DQA.train_rnn()

    # Subsequent rounds: start from an empty memory, collect with the agent's
    # own (non-random) behaviour, log the result, then retrain.
    for _ in range(100):
        DQA.memory.clear()
        res = DQA.fill_memory(300, is_random=False)
        with open(results_path, 'a') as o:
            o.write(str(res) + '\n')
        S.append(res)
        DQA.train_vae()
        DQA.train_rnn()
        print(S)
    
    '''