Python ReplayBuffer.get_minibatch Exemples

Langage de programmation: Python

Espace de nommage/Pack: replay_buffer

Class/Type: ReplayBuffer

Méthode/Fonction: get_minibatch

Exemples sur hotexamples.com : 1

Python ReplayBuffer.get_minibatch - 1 exemple trouvé. Voici l'exemple réel le mieux noté de replay_buffer.ReplayBuffer.get_minibatch, extrait de projets open source. Vous pouvez noter les exemples pour nous aider à en améliorer la qualité.

Méthodes fréquemment utilisées

Afficher Cacher

ReplayBuffer(30)

add(30)

count(26)

get_batch(25)

append(17)

encode_recent_observation(7)

getBatch(7)

add_sample(7)

insert(7)

clear(6)

load(5)

load_memory(5)

can_sample(4)

add_episode(4)

add_transition(4)

get_last_steps(3)

get_size(3)

create_batch(3)

is_ready(3)

add_experience(3)

add_to_memory(2)

make_index(2)

compute_values(2)

compute_value_difference(2)

compute_reward_distances(2)

compute_returns(2)

compute_lambda_returns(2)

fetch_sample(2)

compute_episode_boundaries(2)

encoder_recent_observation(2)

idx(2)

get_batch_data(1)

get_current_size(1)

get_experiences(1)

get_len(1)

get_current_state(1)

load_replay(1)

get_losses_offline(1)

get_memory(1)

get_minibatch(1)

importance_sampling(1)

in_order_iterate(1)

insert_sample(1)

k(1)

length(1)

lenth(1)

load_from_file(1)

get_random_minibatch(1)

dump(1)

get(1)

Méthodes fréquemment utilisées

ReplayBuffer (30)

add (30)

count (26)

get_batch (25)

append (17)

encode_recent_observation (7)

getBatch (7)

add_sample (7)

insert (7)

clear (6)

Méthodes fréquemment utilisées

load (5)

load_memory (5)

can_sample (4)

add_episode (4)

add_transition (4)

get_last_steps (3)

get_size (3)

create_batch (3)

is_ready (3)

add_experience (3)

add_to_memory (2)

make_index (2)

compute_values (2)

compute_value_difference (2)

compute_reward_distances (2)

compute_returns (2)

compute_lambda_returns (2)

fetch_sample (2)

compute_episode_boundaries (2)

encoder_recent_observation (2)

Méthodes fréquemment utilisées

add_to_memory (2)

make_index (2)

compute_values (2)

compute_value_difference (2)

compute_reward_distances (2)

compute_returns (2)

compute_lambda_returns (2)

fetch_sample (2)

compute_episode_boundaries (2)

encoder_recent_observation (2)

idx (2)

get_batch_data (1)

get_current_size (1)

get_experiences (1)

get_len (1)

get_current_state (1)

load_replay (1)

get_losses_offline (1)

get_memory (1)

get_minibatch (1)

importance_sampling (1)

in_order_iterate (1)

insert_sample (1)

k (1)

length (1)

lenth (1)

load_from_file (1)

get_random_minibatch (1)

dump (1)

get (1)

Méthodes fréquemment utilisées

idx (2)

get_batch_data (1)

get_current_size (1)

get_experiences (1)

get_len (1)

get_current_state (1)

load_replay (1)

get_losses_offline (1)

get_memory (1)

get_minibatch (1)

importance_sampling (1)

in_order_iterate (1)

insert_sample (1)

k (1)

length (1)

lenth (1)

load_from_file (1)

get_random_minibatch (1)

dump (1)

get (1)

batch_load (1)

_count (1)

_ptr (1)

addAbsorbing (1)

add_batch (1)

add_data (1)

add_datapoints (1)

add_effects (1)

add_errors (1)

add_expert (1)

add_tuples (1)

adds (1)

as_dataset (1)

buffer_init (1)

full (1)

buffered (1)

cache (1)

clear_buffer (1)

create_episode (1)

current_count (1)

Exemple #1

0

Afficher le fichier

Fichier : test_replay_buffer.py Projet : kastnerkyle/replay_buffer_testing

def _free_memory_totals():
    """Return the fields after the label on the last line of ``free -th``.

    The callers unpack the result into three values (total, used, free).
    The pipe is closed deterministically instead of being left open.
    """
    import os

    with os.popen("free -th") as pipe:
        return pipe.readlines()[-1].split()[1:]


def test_full_run():
    """Fill a ReplayBuffer from random Breakout play and print memory usage.

    Plays 2000 episodes with uniformly random legal actions, adding one
    experience per emulator step and drawing minibatches after every step.
    Roughly every 1000 sent experiences the buffer counters are printed next
    to the system memory totals reported by ``free -th``. After the episodes,
    10000 further minibatches are drawn. The function then opens an IPython
    shell and finally raises ``ValueError`` unconditionally, so it never
    returns normally.

    Raises:
        ValueError: always, once the interactive shell is closed.
    """
    from atari_py.ale_python_interface import ALEInterface

    game = "atari_roms/breakout.bin"
    ale = ALEInterface()

    # Get & Set the desired settings
    ale.setInt('random_seed', 123)

    # Load the ROM file
    ale.loadROM(game)

    # Get the list of legal actions
    legal_actions = ale.getLegalActionSet()

    batch_size = 10
    exp_replay = ReplayBuffer(batch_size)

    (screen_width, screen_height) = ale.getScreenDims()

    tot_m, used_m, free_m = _free_memory_totals()
    last_counter = 0
    random_state = np.random.RandomState(218)
    print("initial: {}, {}, {}".format(tot_m, used_m, free_m))

    # Play 2k episodes
    for episode in range(2000):
        total_reward = 0
        S = np.zeros(screen_width * screen_height, dtype=np.uint8)
        S = S.reshape(screen_height, screen_width)[:84, :84]
        this_counter = exp_replay.sent_counter
        if this_counter > last_counter + 1000:
            last_counter = this_counter
            tot_m, used_m, free_m = _free_memory_totals()
            # the first three entries should match til 1M steps
            # then the second 2 should continue in lock step
            print("{}: {}, {}; {}, {}, {}".format(
                exp_replay.sent_counter, len(exp_replay.memory),
                len(exp_replay.reverse_experience_lookup.keys()),
                tot_m, used_m, free_m))
        while not ale.game_over():
            S_prime = np.zeros(screen_width * screen_height, dtype=np.uint8)
            ale.getScreen(S_prime)
            # Keep only the top-left 84x84 corner of the frame.
            S_prime = S_prime.reshape(screen_height, screen_width)[:84, :84]
            a = random_state.choice(len(legal_actions))
            action = legal_actions[a]
            # Apply an action and get the resulting reward
            reward = ale.act(action)
            won = 0
            ongoing_flag = 1
            experience = (S_prime, action, reward, won, ongoing_flag)
            S = S_prime
            exp_replay.add_experience(experience)
            # Exercise both call forms: default arguments, then an explicit
            # index list. Only the second result is inspected.
            batch = exp_replay.get_minibatch()
            batch = exp_replay.get_minibatch(index_list=[1, 2, 3, 10, 11])
            if batch is not None:
                mb_S = batch[0]
                other_info = batch[1]
            del batch
            total_reward += reward
        # Single-argument print so the output is identical on Python 2 and 3.
        print("Episode {} ended with score: {}".format(episode, total_reward))
        ale.reset_game()

    lst = 0
    for i in range(10000):
        if i > lst + 1000:
            tot_m, used_m, free_m = _free_memory_totals()
            print("POST MEM {}: {}, {}; {}, {}, {}".format(
                exp_replay.sent_counter, len(exp_replay.memory),
                len(exp_replay.reverse_experience_lookup.keys()),
                tot_m, used_m, free_m))
            lst = i
        # NOTE(review): unlike the loop above there is no None check here;
        # confirm get_minibatch() cannot return None at this point.
        batch = exp_replay.get_minibatch()
        mb_S = batch[0]
        other_info = batch[1]

    # Drop into an interactive shell for manual inspection, then stop the run
    # with an unconditional error.
    from IPython import embed
    embed()
    raise ValueError()