def print_prediction(self, prediction, params=None, stream=None):
    """Prints the translation hypotheses of a single prediction.

    Args:
      prediction: A dict of model outputs; expected keys are ``log_probs`` and
        either ``tokens``/``length`` (token-level output) or ``text``
        (already detokenized output). ``alignment`` must be present when
        alignments are requested.
      params: Optional dict of printing options (``with_scores``,
        ``with_alignments``).
      stream: The output stream to write to.

    Raises:
      ValueError: if ``with_alignments`` is set but the prediction has no
        ``alignment`` entry.
    """
    if params is None:
        params = {}
    with_scores = params.get("with_scores")
    alignment_type = params.get("with_alignments")
    if alignment_type and "alignment" not in prediction:
        raise ValueError(
            "with_alignments is set but the model did not return alignment information"
        )
    num_hypotheses = len(prediction["log_probs"])
    for i in range(num_hypotheses):
        # Fix: target_length was previously unbound when the model returned
        # detokenized "text" and alignments were requested (NameError).
        # None here makes the alignment slice below a no-op (full matrix).
        target_length = None
        if "tokens" in prediction:
            target_length = prediction["length"][i]
            tokens = prediction["tokens"][i][:target_length]
            sentence = self.labels_inputter.tokenizer.detokenize(tokens)
        else:
            sentence = prediction["text"][i]
        score = None
        attention = None
        if with_scores:
            score = prediction["log_probs"][i]
        if alignment_type:
            attention = prediction["alignment"][i][:target_length]
        sentence = misc.format_translation_output(
            sentence,
            score=score,
            attention=attention,
            alignment_type=alignment_type,
        )
        misc.print_as_bytes(sentence, stream=stream)
def detokenize_stream(self, input_stream=sys.stdin, output_stream=sys.stdout, delimiter=" "):
    """Detokenizes a stream of sentences.

    Args:
      input_stream: The input stream.
      output_stream: The output stream.
      delimiter: The token delimiter used for text serialization.
    """
    for serialized in input_stream:
        # Split the serialized line back into tokens, then rebuild the text.
        detokenized = self.detokenize(serialized.strip().split(delimiter))
        misc.print_as_bytes(detokenized, stream=output_stream)
def tokenize_stream(self, input_stream=sys.stdin, output_stream=sys.stdout, delimiter=" "):
    """Tokenizes a stream of sentences.

    Args:
      input_stream: The input stream.
      output_stream: The output stream.
      delimiter: The token delimiter to use for text serialization.
    """
    for raw_line in input_stream:
        # Tokenize each line and serialize the tokens with the delimiter.
        pieces = self.tokenize(raw_line.strip())
        misc.print_as_bytes(delimiter.join(pieces), stream=output_stream)
def print_score(self, score, params=None, stream=None):
    """Prints a scoring result for a single sentence.

    Args:
      score: A dict with keys ``length``, ``tokens``, ``cross_entropy``,
        ``score``, and optionally ``attention``.
      params: Optional dict of printing options (``with_token_level``,
        ``with_alignments``).
      stream: The output stream to write to.
    """
    if params is None:
        params = {}
    num_tokens = score["length"]
    detokenized = self.decoder_inputter.tokenizer.detokenize(score["tokens"][:num_tokens])
    # Token-level cross entropy and attention are only emitted on request /
    # availability.
    token_level_scores = (
        score["cross_entropy"][:num_tokens] if params.get("with_token_level") else None
    )
    attention = score["attention"][:num_tokens] if "attention" in score else None
    formatted = misc.format_translation_output(
        detokenized,
        score=score["score"],
        token_level_scores=token_level_scores,
        attention=attention,
        alignment_type=params.get("with_alignments"),
    )
    misc.print_as_bytes(formatted, stream=stream)
def tokenize_stream(
    self,
    input_stream=sys.stdin,
    output_stream=sys.stdout,
    delimiter=" ",
    training=True,
):
    """Tokenizes a stream of sentences.

    Args:
      input_stream: The input stream.
      output_stream: The output stream.
      delimiter: The token delimiter to use for text serialization.
      training: Set to ``False`` to tokenize for inference.
    """
    for raw_line in input_stream:
        # Tokenize in the requested mode and serialize with the delimiter.
        pieces = self.tokenize(raw_line.strip(), training=training)
        misc.print_as_bytes(delimiter.join(pieces), stream=output_stream)
def _process_stream_as_dataset(
    input_stream,
    output_stream,
    map_func,
    batch_size=512,
    num_parallel_calls=4,
):
    """Applies ``map_func`` on batches of lines read from a stream.

    The input stream is wrapped in a ``tf.data`` pipeline so that ``map_func``
    can run on batches of strings in parallel; each resulting line is written
    to the output stream.

    Args:
      input_stream: An iterable of input lines.
      output_stream: The stream to write the mapped lines to.
      map_func: A function mapping a batch of strings to a batch of strings.
      batch_size: The number of lines to process at once.
      num_parallel_calls: The parallelism level of the map transformation.

    Raises:
      TypeError: if ``map_func`` does not produce a 1-D string tensor.
    """
    dataset = (
        tf.data.Dataset.from_generator(
            lambda: input_stream,
            output_types=tf.string,
            output_shapes=tf.TensorShape([]),
        )
        .batch(batch_size)
        .map(map_func, num_parallel_calls=num_parallel_calls)
    )
    expected_spec = tf.TensorSpec(shape=[None], dtype=tf.string)
    if dataset.element_spec != expected_spec:
        raise TypeError(
            "Expected map_func to produce elements with spec %s, but got spec %s instead"
            % (expected_spec, dataset.element_spec)
        )
    for batch in dataset.as_numpy_iterator():
        for element in batch:
            misc.print_as_bytes(element, stream=output_stream)
def print_prediction(self, prediction, params=None, stream=None):
    """Prints the predicted class of a single prediction.

    Args:
      prediction: A dict of model outputs with a ``classes`` entry.
      params: Unused printing options, kept for interface consistency.
      stream: The output stream to write to.
    """
    predicted_class = prediction["classes"]
    misc.print_as_bytes(predicted_class, stream=stream)
def print_prediction(self, prediction, params=None, stream=None):
    """Prints the detokenized output of a single prediction.

    Args:
      prediction: A dict of model outputs with ``tokens`` and ``length``
        entries.
      params: Unused printing options, kept for interface consistency.
      stream: The output stream to write to.
    """
    num_tokens = prediction["length"]
    # Drop padding before detokenizing.
    detokenized = self.examples_inputter.tokenizer.detokenize(
        prediction["tokens"][:num_tokens]
    )
    misc.print_as_bytes(misc.format_translation_output(detokenized), stream=stream)
def print_prediction(self, prediction, params=None, stream=None):
    """Prints the predicted tag sequence of a single prediction.

    Args:
      prediction: A dict of model outputs with ``tags`` (byte strings) and
        ``length`` entries.
      params: Unused printing options, kept for interface consistency.
      stream: The output stream to write to.
    """
    num_tags = prediction["length"]
    # Tags are byte strings; join them with a byte-space before printing.
    predicted_tags = prediction["tags"][:num_tags]
    misc.print_as_bytes(b" ".join(predicted_tags), stream=stream)