Example #1
  def testSourceTargetValues(self):
    max_length = 50
    p = self._CreatePunctuatorInputParams()
    with self.session(use_gpu=False) as sess:
      inp = input_generator.PunctuatorInput(p)
      tokenizer = inp.tokenizer_dict['default']

      fetched = py_utils.NestedMap(sess.run(inp.GetPreprocessedInputBatch()))
      source_ids = fetched.src.ids
      tgt_ids = fetched.tgt.ids
      tgt_labels = fetched.tgt.labels

      expected_ref = ('His approach was inquisitive , a meeting of artful '
                      'hesitation with fluid technique .')

      normalized_ref = expected_ref.lower().translate(None, string.punctuation)
      normalized_ref = ' '.join(normalized_ref.split())
      _, expected_src_ids, _ = sess.run(
          tokenizer.StringsToIds(
              tf.convert_to_tensor([normalized_ref]), max_length=max_length))
      expected_tgt_ids, expected_tgt_labels, _ = sess.run(
          tokenizer.StringsToIds(
              tf.convert_to_tensor([expected_ref]), max_length=max_length))

      self.assertAllEqual(expected_src_ids[0], source_ids[0, :max_length])
      self.assertAllEqual(expected_tgt_ids[0], tgt_ids[0, :max_length])
      self.assertAllEqual(expected_tgt_labels[0], tgt_labels[0, :max_length])
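
Note: the normalization in this example uses the Python 2 signature str.translate(None, string.punctuation); on Python 3, str.translate expects a mapping built with str.maketrans. Below is a minimal standalone sketch of the same source-side preprocessing (lowercase, delete punctuation, collapse whitespace); the normalize helper is purely illustrative and not part of the Lingvo API.

import string

def normalize(ref):
  # Lowercase, delete punctuation, and collapse whitespace runs, mirroring
  # how the test derives the unpunctuated source text from the reference.
  no_punct = ref.lower().translate(str.maketrans('', '', string.punctuation))
  return ' '.join(no_punct.split())

ref = ('His approach was inquisitive , a meeting of artful '
       'hesitation with fluid technique .')
print(normalize(ref))
# his approach was inquisitive a meeting of artful hesitation with fluid technique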
Example #2
    def testSourceTargetValues(self):
        max_length = 50
        p = self._CreatePunctuatorInputParams()
        with self.session(use_gpu=False):
            inp = input_generator.PunctuatorInput(p)

            fetched = py_utils.NestedMap(
                self.evaluate(inp.GetPreprocessedInputBatch()))
            source_ids = fetched.src.ids
            tgt_ids = fetched.tgt.ids
            tgt_labels = fetched.tgt.labels

            expected_ref = (
                b'Elk calling -- a skill that hunters perfected long ago to lure '
                b'game with the promise of a little romance -- is now its own sport .'
            )

            normalized_ref = expected_ref.lower().translate(
                None, string.punctuation.encode('utf-8'))
            normalized_ref = b' '.join(normalized_ref.split())
            _, expected_src_ids, _ = self.evaluate(
                inp.tokenizer.StringsToIds(
                    tf.convert_to_tensor([normalized_ref]),
                    max_length=max_length))
            expected_tgt_ids, expected_tgt_labels, _ = self.evaluate(
                inp.tokenizer.StringsToIds(
                    tf.convert_to_tensor([expected_ref]),
                    max_length=max_length))

            self.assertAllEqual(expected_src_ids[0],
                                source_ids[0, :max_length])
            self.assertAllEqual(expected_tgt_ids[0], tgt_ids[0, :max_length])
            self.assertAllEqual(expected_tgt_labels[0],
                                tgt_labels[0, :max_length])
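
Here the reference strings are bytes, so punctuation is removed with bytes.translate(None, delete), which remains valid on Python 3; the deletion table must itself be bytes, hence the .encode('utf-8'). A short standalone check of that bytes-side normalization, using the same sentence as the test above:

import string

ref = (b'Elk calling -- a skill that hunters perfected long ago to lure '
       b'game with the promise of a little romance -- is now its own sport .')
# bytes.translate(table, delete): with table=None the bytes are left unchanged
# and every byte listed in `delete` is removed.
no_punct = ref.lower().translate(None, string.punctuation.encode('utf-8'))
print(b' '.join(no_punct.split()))
# b'elk calling a skill that hunters perfected long ago to lure game with the
#   promise of a little romance is now its own sport'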
Example #3
  def testBasic(self):
    p = self._CreatePunctuatorInputParams()
    with self.session(use_gpu=False) as sess:
      inp = input_generator.PunctuatorInput(p)
      # Runs a few steps.
      for _ in range(10):
        sess.run(inp.GetPreprocessedInputBatch())
Example #4
    def testSourceTargetValues(self):
        max_length = 50
        p = self._CreatePunctuatorInputParams()
        with self.session(use_gpu=False) as sess:
            inp = input_generator.PunctuatorInput(p)
            tokenizer = inp.tokenizer_dict['default']

            fetched = py_utils.NestedMap(
                sess.run(inp.GetPreprocessedInputBatch()))
            source_ids = fetched.src.ids
            tgt_ids = fetched.tgt.ids
            tgt_labels = fetched.tgt.labels

            expected_ref = 'The internet is sort-of-40 this year .'

            # "the internet is sortof40 this year" - lower-case, no dashes, no dot.
            normalized_ref = expected_ref.lower().translate(
                None, string.punctuation)
            expected_src_ids, _, _ = sess.run(
                tokenizer.StringsToIds([normalized_ref],
                                       max_length=max_length))
            expected_tgt_ids, expected_tgt_labels, _ = sess.run(
                tokenizer.StringsToIds([expected_ref], max_length=max_length))

            self.assertAllEqual(expected_src_ids[0],
                                source_ids[0, :max_length])
            self.assertAllEqual(expected_tgt_ids[0], tgt_ids[0, :max_length])
            self.assertAllEqual(expected_tgt_labels[0],
                                tgt_labels[0, :max_length])