Exemples Python de Batch.cat_list

Langage de programmation: Python

Espace de noms/Paquet : tianshou.data

Class/Type: Batch

Méthode/Fonction: cat_list

Exemples sur hotexamples.com : 2

Python Batch.cat_list - 2 exemples trouvés. Ce sont les exemples réels les mieux notés de tianshou.data.Batch.cat_list extraits de projets open source. Vous pouvez noter les exemples pour nous aider à en améliorer la qualité.

Méthodes fréquemment utilisées

Afficher Cacher

Batch(30)

split(30)

weight(28)

pop(23)

returns(17)

stack(14)

update(11)

cat(9)

rew(9)

obs(8)

get(7)

act(7)

to_torch(6)

logp_old(6)

done(6)

cat_(6)

append(5)

adv(5)

is_empty(5)

keys(3)

to_numpy(3)

items(3)

obs_next(2)

update_weight(2)

empty_(2)

empty(2)

cat_list(2)

v_s(2)

v(2)

b(2)

values(1)

value_targets(1)

advantages(1)

loss(1)

policy(1)

stack_(1)

__repr__(1)

info(1)

indice(1)

Méthodes fréquemment utilisées

Batch (30)

split (30)

weight (28)

pop (23)

returns (17)

stack (14)

update (11)

cat (9)

rew (9)

obs (8)

Méthodes fréquemment utilisées

get (7)

act (7)

to_torch (6)

logp_old (6)

done (6)

cat_ (6)

append (5)

adv (5)

is_empty (5)

keys (3)

to_numpy (3)

items (3)

obs_next (2)

update_weight (2)

empty_ (2)

empty (2)

cat_list (2)

v_s (2)

v (2)

b (2)

Méthodes fréquemment utilisées

to_numpy (3)

items (3)

obs_next (2)

update_weight (2)

empty_ (2)

empty (2)

cat_list (2)

v_s (2)

v (2)

b (2)

values (1)

value_targets (1)

advantages (1)

loss (1)

policy (1)

stack_ (1)

__repr__ (1)

info (1)

indice (1)

Méthodes fréquemment utilisées

values (1)

value_targets (1)

advantages (1)

loss (1)

policy (1)

stack_ (1)

__repr__ (1)

info (1)

indice (1)

Exemple #1

0

Afficher le fichier

def trj_sample(self, trj_num=None):
    """Return a Batch concatenated from randomly ordered items of ``self``.

    Args:
        trj_num: Number of items to draw. When ``None``, every item is
            used, in shuffled order. Otherwise only the first ``trj_num``
            entries of the random permutation are kept.

    Returns:
        A new ``Batch`` filled via ``cat_list`` with the selected items.

    Raises:
        AssertionError: If ``trj_num`` is larger than ``self.__len__()``.
    """
    # Validate before drawing from the RNG so a failed call does not
    # consume random state.
    if trj_num is not None:
        assert trj_num <= self.__len__()

    shuffled = np.random.permutation(self.__len__())
    chosen = shuffled if trj_num is None else shuffled[:trj_num]

    picked_items = list(map(self.__getitem__, chosen))

    merged = Batch()
    merged.cat_list(picked_items)
    return merged

Exemple #2

0

Afficher le fichier

def trj_by_policy(self, batch):
    """Re-run ``self`` over ``batch`` one trajectory step at a time.

    ``batch`` is treated as consecutive groups of ``self.trj_clip_steps``
    entries. For each step offset, the entries at that offset in every
    group are sliced out, passed through ``self(...)``, and their ``act``
    fields are overwritten with the inference output. From the second step
    on, ``obs.s`` is first rebuilt from the previous step's ``obs.s`` and
    the previous inference output.

    Args:
        batch: Input batch; its length must be a multiple of
            ``self.trj_clip_steps``. Presumably a tianshou ``Batch`` with
            ``obs.s`` and ``act.o`` tensors -- confirm against the caller.

    Returns:
        A batch holding the rewritten entries, reordered so that entry
        ``k`` corresponds to entry ``k`` of the input.

    Raises:
        AssertionError: If ``len(batch)`` is not divisible by
            ``self.trj_clip_steps``.
    """
    assert len(batch) % self.trj_clip_steps == 0

    # Width of the leading part of ``act_m``; the remaining columns are
    # what gets stored as ``act.s_next`` and fed into the next ``obs.s``.
    head_width = batch.act.o.shape[-1]

    last_inference = None
    last_slice = None
    rewritten_slices = []

    for offset in range(self.trj_clip_steps):
        picks = np.arange(offset, len(batch), self.trj_clip_steps)
        current = batch[picks]

        if last_inference is not None:
            # Correct obs: append the previously inferred tail of
            # ``act_m`` as a new entry along dim 1, then drop the oldest
            # entry so the size along dim 1 stays the same.
            tail = last_inference.act_m[:, head_width:].cpu()
            tail = tail.reshape(len(last_slice), 1, -1)
            extended = torch.cat([last_slice.obs.s, tail], 1)
            current.obs.s = extended[:, 1:, :]
            # Drop the old inference result before computing the next one.
            del last_inference

        last_inference = self(current)

        # Correct act: replace the stored actions with the fresh output.
        inferred_m = last_inference.act_m
        current.act.a = last_inference.act_d.cpu()
        current.act.o = inferred_m[:, :head_width].contiguous().cpu()
        current.act.s_next = inferred_m[:, head_width:].contiguous().cpu()

        last_slice = current
        rewritten_slices.append(current)

    merged = Batch()
    merged.cat_list(rewritten_slices)

    # ``merged`` is laid out step-major (all offset-0 entries, then all
    # offset-1 entries, ...). Interleave back to the input ordering.
    group_count = len(rewritten_slices[0])
    restore_order = [
        group + step * group_count
        for group in range(group_count)
        for step in range(self.trj_clip_steps)
    ]
    restore_order = np.array(restore_order).astype(np.int32)

    return merged[restore_order]