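# Module scaffold (inferred, not shown in the excerpt): these are methods of
# AllenNLP's NerTagIndexer test case, and self.tokenizer is assumed to be a
# SpacyWordSplitter with NER enabled, since the tests read token.ent_type_.
from collections import defaultdict

from allennlp.common.testing import AllenNlpTestCase
from allennlp.data import Token, Vocabulary
from allennlp.data.token_indexers import NerTagIndexer
from allennlp.data.tokenizers.word_splitter import SpacyWordSplitter


class TestNerTagIndexer(AllenNlpTestCase):
    def setUp(self):
        super().setUp()
        # ner=True so spaCy attaches entity types to the tokens it produces.
        self.tokenizer = SpacyWordSplitter(ner=True)
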
    def test_tokens_to_indices_uses_ner_tags(self):
        tokens = self.tokenizer.split_words("Larry Page is CEO of Google.")
        # Append a sentence-boundary token, which carries no entity type.
        tokens = list(tokens) + [Token("</S>")]
        vocab = Vocabulary()
        person_index = vocab.add_token_to_namespace("PERSON", namespace="ner_tags")
        none_index = vocab.add_token_to_namespace("NONE", namespace="ner_tags")
        vocab.add_token_to_namespace("ORG", namespace="ner_tags")
        indexer = NerTagIndexer(namespace="ner_tags")
        # tokens[1] is "Page" (tagged PERSON by spaCy); the trailing "</S>"
        # token has no entity type and should map to NONE.
        assert indexer.tokens_to_indices([tokens[1]], vocab, "tokens1") == {"tokens1": [person_index]}
        assert indexer.tokens_to_indices([tokens[-1]], vocab, "tokens-1") == {"tokens-1": [none_index]}

    def test_blank_ner_tag(self):
        tokens = [
            Token(token)._replace(ent_type_="") for token in "allennlp is awesome .".split(" ")
        ]
        indexer = NerTagIndexer()
        counter = defaultdict(lambda: defaultdict(int))
        for token in tokens:
            indexer.count_vocab_items(token, counter)
        # spaCy uses an empty string to indicate "no NER tag",
        # which the indexer converts to "NONE".
        assert counter["ner_tokens"]["NONE"] == 4
        vocab = Vocabulary(counter)
        none_index = vocab.get_token_index("NONE", "ner_tokens")
        # Should raise no exception.
        indices = indexer.tokens_to_indices(tokens, vocab, index_name="ner")
        assert {"ner": [none_index, none_index, none_index, none_index]} == indices