예제 #1
0
 def _make_examples(self, sentences):
   word_vocab = embeddings.get_word_vocab(self.config)
   char_vocab = embeddings.get_char_vocab()
   return [
       example.Example(sentence, word_vocab, char_vocab)
       for sentence in sentences
   ]
예제 #2
0
 def _make_examples(self, sentences):
   word_vocab = embeddings.get_word_vocab(self.config)
   char_vocab = embeddings.get_char_vocab()
   return [
       example.Example(sentence, word_vocab, char_vocab)
       for sentence in sentences
   ]
예제 #3
0
 def _get_examples(self, split):
     word_vocab = embeddings.get_word_vocab(self._config)
     char_vocab = embeddings.get_char_vocab()
     examples = [
         SentenceClassificationExample(self._config, words, tag, word_vocab,
                                       char_vocab, self.label_mapping,
                                       self._task_name)
         for words, tag in self.get_labeled_sentences(split)
     ]
     return examples
예제 #4
0
 def _get_examples(self, split):
   word_vocab = embeddings.get_word_vocab(self._config)
   word_vocab_vi = embeddings.get_word_vocab_vi(self._config)
   char_vocab = embeddings.get_char_vocab()
   examples = [
       TranslationExample(
           self._config, words_src, words_tgt, size_src, size_tgt,
           word_vocab, char_vocab, self._task_name, word_vocab_vi, split)
       for words_src, words_tgt, size_src, size_tgt in self.get_sentence_tuples(split)
   ]
   return examples
예제 #5
0
 def _get_examples(self, split):
   word_vocab = embeddings.get_word_vocab(self._config)
   char_vocab = embeddings.get_char_vocab()
   examples = [
       TaggingExample(
           self._config, self._is_token_level, words, tags,
           word_vocab, char_vocab, self.label_mapping, self._task_name)
       for words, tags in self.get_labeled_sentences(split)]
   if self._config.train_set_percent < 100:
     utils.log('using reduced train set ({:}%)'.format(
         self._config.train_set_percent))
     random.shuffle(examples)
     examples = examples[:int(len(examples) *
                              self._config.train_set_percent / 100.0)]
   return examples
예제 #6
0
 def _get_examples(self, split):
   word_vocab = embeddings.get_word_vocab(self._config)
   char_vocab = embeddings.get_char_vocab()
   examples = [
       TaggingExample(
           self._config, self._is_token_level, words, tags,
           word_vocab, char_vocab, self.label_mapping, self._task_name)
       for words, tags in self.get_labeled_sentences(split)]
   if self._config.train_set_percent < 100:
     utils.log('using reduced train set ({:}%)'.format(
         self._config.train_set_percent))
     random.shuffle(examples)
     examples = examples[:int(len(examples) *
                              self._config.train_set_percent / 100.0)]
   return examples
예제 #7
0
  def get_examples_translate(config, src, split):
    words_src = src.strip().split()
    size_src = len(words_src)
    words_tgt = []
    size_tgt = 1

    word_vocab = embeddings.get_word_vocab(config)
    word_vocab_vi = embeddings.get_word_vocab_vi(config)
    char_vocab = embeddings.get_char_vocab()

    examples = [
      TranslationExample(
        config, words_src, words_tgt, size_src, size_tgt,
        word_vocab, char_vocab, 'translate', word_vocab_vi, split)
    ]

    return examples