Python Batch Beispiele

Programmiersprache: Python

Namespace / Paketname: texar.torch.data.data.dataset_utils

Klasse / Typ: Batch

Beispiele auf hotexamples.com: 10

Python Batch – 10 Beispiele gefunden. Dies sind die am besten bewerteten Python-Beispiele für die Klasse texar.torch.data.data.dataset_utils.Batch, die aus Open-Source-Projekten extrahiert wurden. Sie können Beispiele bewerten, um die Qualität der Beispiele zu verbessern.

Häufig verwendete Methoden

Anzeigen Verbergen

Batch(10)

Häufig verwendete Methoden

Batch (10)

Beispiel #1

Datei anzeigen

Datei: mono_text_data.py Projekt: charlestaylorstella/transformer_dialog

    def collate(self, examples: List[List[str]]) -> Batch:
        """Collate tokenized sentences into a single :class:`Batch`.

        Each example is a list of token strings. Tokens are mapped to ids
        through ``self._vocab`` and handed to ``padded_batch`` together with
        ``self._pad_length``; the raw token lists are then extended with
        empty strings to the same width.

        Args:
            examples: One list of token strings per example.

        Returns:
            A ``Batch`` holding the padded token lists, the id tensor and
            the length tensor under ``self.text_name``,
            ``self.text_id_name`` and ``self.length_name`` respectively.
        """
        to_ids = self._vocab.map_tokens_to_ids_py
        id_rows = [to_ids(tokens) for tokens in examples]
        id_matrix, seq_lengths = padded_batch(
            id_rows, self._pad_length,
            pad_value=self._vocab.pad_token_id)

        # Without a configured pad length, the longest reported length in
        # this batch decides the width of the padded token lists.
        width = self._pad_length or max(seq_lengths)
        padded_tokens = []
        for tokens in examples:
            shortfall = width - len(tokens)
            if shortfall > 0:
                tokens = tokens + [''] * shortfall
            padded_tokens.append(tokens)

        id_tensor = torch.from_numpy(id_matrix)
        length_tensor = torch.tensor(seq_lengths, dtype=torch.long)
        return Batch(len(padded_tokens), batch={
            self.text_name: padded_tokens,
            self.text_id_name: id_tensor,
            self.length_name: length_tensor,
        })

Beispiel #2

Datei anzeigen

Datei: multi_aligned_data.py Projekt: yesxiaoyu/texar-pytorch

 def collate(self, examples) -> Batch:
     """Collate aligned examples by delegating to each sub-dataset.

     ``examples`` is transposed so that the i-th group contains the i-th
     component of every example. Each group is collated by
     ``self._databases[i]`` and the resulting fields are copied into one
     dictionary under the names given by ``self._names[i]``.

     Returns:
         A ``Batch`` of size ``len(examples)`` built from the merged fields.
     """
     merged: Dict[str, Any] = {}
     # zip(*examples) regroups the per-example components by position.
     for index, column in enumerate(zip(*examples)):
         sub_batch = self._databases[index].collate(list(column))
         for source_key, target_name in self._names[index].items():
             merged[target_name] = sub_batch[source_key]
     return Batch(len(examples), batch=merged)

Beispiel #3

Datei anzeigen

Datei: data_iterators.py Projekt: hunterhector/texar-pytorch

def move_memory(data, device):
    """Move every tensor found in ``data`` to ``device``.

    Tensors are transferred with ``non_blocking=True``; any other leaf value
    is returned unchanged. A ``Batch`` input is rebuilt as a new ``Batch`` of
    the same length; any other input is passed through ``map_structure``.

    Args:
        data: A ``Batch`` or any structure accepted by ``map_structure``.
        device: Target device forwarded to ``Tensor.to``.

    Returns:
        The same structure with its tensors moved to ``device``.
    """
    def _to_device(leaf):
        # Non-tensor leaves pass through untouched.
        if not isinstance(leaf, torch.Tensor):
            return leaf
        return leaf.to(device=device, non_blocking=True)

    if not isinstance(data, Batch):
        return map_structure(_to_device, data)

    size = len(data)
    moved = {}
    for key, value in data.items():
        moved[key] = map_structure(_to_device, value)
    return Batch(size, batch=moved)

Beispiel #4

Datei anzeigen

Datei: large_file_test.py Projekt: DrSnowbird/texar-pytorch-docker

 def collate(self, examples: List[Example]) -> Batch:
     """Zero-pad ``(src, tgt)`` pairs into two int64 tensors.

     Each side is padded on the right with zeros up to the longest
     sequence of that side in the batch, then moved to ``self.device``.

     Args:
         examples: Pairs of ``(src, tgt)`` sequences.

     Returns:
         A ``Batch`` with the fields ``src`` and ``tgt``.
     """
     row_count = len(examples)
     src_width = max(len(src) for src, _ in examples)
     tgt_width = max(len(tgt) for _, tgt in examples)

     # Start from all-zero matrices so unfilled positions act as padding.
     src_matrix = np.zeros((row_count, src_width), dtype=np.int64)
     tgt_matrix = np.zeros((row_count, tgt_width), dtype=np.int64)
     for row, (src, tgt) in enumerate(examples):
         src_matrix[row, :len(src)] = src
         tgt_matrix[row, :len(tgt)] = tgt

     return Batch(
         row_count,
         src=torch.from_numpy(src_matrix).to(device=self.device),
         tgt=torch.from_numpy(tgt_matrix).to(device=self.device))

Beispiel #5

Datei anzeigen

Datei: paired_text_data.py Projekt: DrSnowbird/texar-pytorch-docker

    def collate(self, examples: List[Tuple[List[str], List[str]]]) -> Batch:
        """Collate paired (source, target) token lists into a ``Batch``.

        Both sides go through the same steps with their own vocabulary and
        pad length: tokens are mapped to ids, the ids are passed to
        ``padded_batch``, the raw token lists are extended with empty
        strings to the same width, and ids and lengths are converted to
        tensors on ``self.device``.

        Args:
            examples: Tuples of ``(source_tokens, target_tokens)``.

        Returns:
            A ``Batch`` with ``source_text``, ``source_text_ids``,
            ``source_length``, ``target_text``, ``target_text_ids`` and
            ``target_length``.
        """
        def _collate_side(sentences, vocab, fixed_length):
            # Numericalize and pad one side of the pair.
            ids = [vocab.map_tokens_to_ids_py(tokens) for tokens in sentences]
            ids, lengths = padded_batch(
                ids, fixed_length, pad_value=vocab.pad_token_id)

            # Without a fixed pad length, use the longest reported length.
            width = fixed_length or max(lengths)
            padded = []
            for tokens in sentences:
                shortfall = width - len(tokens)
                if shortfall > 0:
                    tokens = tokens + [''] * shortfall
                padded.append(tokens)

            id_tensor = torch.from_numpy(ids).to(device=self.device)
            length_tensor = torch.tensor(
                lengths, dtype=torch.long, device=self.device)
            return padded, id_tensor, length_tensor

        src_text, src_ids, src_lengths = _collate_side(
            [pair[0] for pair in examples],
            self._src_vocab, self._src_pad_length)
        tgt_text, tgt_ids, tgt_lengths = _collate_side(
            [pair[1] for pair in examples],
            self._tgt_vocab, self._tgt_pad_length)

        return Batch(len(examples),
                     source_text=src_text,
                     source_text_ids=src_ids,
                     source_length=src_lengths,
                     target_text=tgt_text,
                     target_text_ids=tgt_ids,
                     target_length=tgt_lengths)

Beispiel #6

Datei anzeigen

 def collate(self, examples: List[Dict[str, Any]]) -> Batch:
     """Collate feature dictionaries according to each feature's method.

     For every feature in ``self._features`` the per-example values are
     gathered into a list, then handled by ``collate_method``:

     * ``CollateMethod.List``: the Python list is kept as is.
     * ``CollateMethod.StackedTensor``: values are stacked along axis 0.
     * anything else: values are passed to ``padded_batch``.

     Stacked or padded results that are not already tensors are converted
     with ``torch.from_numpy`` unless the feature dtype is ``np.str_`` or
     ``np.bytes_``.

     Returns:
         A ``Batch`` of size ``len(examples)`` built from the collated
         features.
     """
     collated = {}
     for name, spec in self._features.items():
         column = [example[name] for example in examples]
         method = spec.collate_method

         if method is CollateMethod.List:
             # Nothing to merge: keep the plain Python list.
             collated[name] = column
             continue

         if method is CollateMethod.StackedTensor:
             column = np.stack(column, axis=0)
         else:
             column, _ = padded_batch(column)

         # String and bytes features are left as NumPy output.
         already_final = (isinstance(column, torch.Tensor)
                          or spec.dtype in [np.str_, np.bytes_])
         if not already_final:
             column = torch.from_numpy(column)
         collated[name] = column
     return Batch(len(examples), collated)

Beispiel #7

Datei anzeigen

 def collate(self, examples: List[Dict[str, Any]]) -> Batch:
     """Collate feature dictionaries according to each feature's shape.

     For every feature in ``self._features`` the per-example values are
     gathered into a list, then handled by the descriptor's ``shape``:

     * ``shape is None``: the Python list is kept as is.
     * non-empty shape whose first entry is ``None``: values are passed
       to ``padded_batch``.
     * any other shape: values are stacked along axis 0.

     Stacked or padded results that are not already tensors are converted
     with ``torch.from_numpy`` unless the feature dtype is ``np.str_`` or
     ``np.bytes_``.

     Returns:
         A ``Batch`` of size ``len(examples)`` built from the collated
         features.
     """
     collated = {}
     for name, spec in self._features.items():
         column = [example[name] for example in examples]
         shape = spec.shape

         if shape is None:
             # No declared shape: keep the plain Python list.
             collated[name] = column
             continue

         if len(shape) > 0 and shape[0] is None:
             # Leading dimension is unspecified, so pad instead of stacking.
             column, _ = padded_batch(column)
         else:
             column = np.stack(column, axis=0)

         # String and bytes features are left as NumPy output.
         already_final = (isinstance(column, torch.Tensor)
                          or spec.dtype in [np.str_, np.bytes_])
         if not already_final:
             column = torch.from_numpy(column)
         collated[name] = column
     return Batch(len(examples), collated)

Beispiel #8

Datei anzeigen

Datei: data_iterators_test.py Projekt: swapnull7/texar-pytorch

 def collate(self, examples: List[Example]) -> Batch:
     """Split examples into two NumPy arrays and wrap them in a ``Batch``.

     Element 0 of every example goes into the ``numbers`` field and
     element 1 into the ``strings`` field. The batch size is the length
     of the ``numbers`` array.
     """
     first_items = [example[0] for example in examples]
     second_items = [example[1] for example in examples]
     number_array = np.asarray(first_items)
     string_array = np.asarray(second_items)
     return Batch(len(number_array),
                  numbers=number_array,
                  strings=string_array)

Beispiel #9

Datei anzeigen

Datei: data_iterators_test.py Projekt: swapnull7/texar-pytorch

 def collate(self, examples):
     """Wrap ``examples`` unchanged in a ``Batch`` under the ``text`` field."""
     batch_size = len(examples)
     return Batch(batch_size, text=examples)

Beispiel #10

Datei anzeigen

 def collate(self, examples: List[Union[int, float]]) -> Batch:
     """Collate scalar examples into a single tensor on ``self.device``.

     The examples are first converted to a NumPy array of dtype
     ``self._to_data_type``, then to a tensor that is moved to
     ``self.device``.

     Returns:
         A ``Batch`` of size ``len(examples)`` with the tensor stored
         under ``self.data_name``.
     """
     as_array = np.array(examples, dtype=self._to_data_type)
     as_tensor = torch.from_numpy(as_array).to(device=self.device)
     fields = {self.data_name: as_tensor}
     return Batch(len(examples), batch=fields)