@classmethod
def build_dictionary(
    cls, filenames, workers=1, threshold=-1, nwords=-1, padding_factor=8
):
    """Build a BertDictionary by counting tokens in the given corpus files."""
    d = BertDictionary()
    for filename in filenames:
        # Count token frequencies in each file using fairseq's line tokenizer.
        Dictionary.add_file_to_dictionary(
            filename, d, tokenizer.tokenize_line, workers
        )
    # Drop rare symbols, optionally cap the vocabulary size, and pad the
    # vocabulary to a multiple of padding_factor.
    d.finalize(threshold=threshold, nwords=nwords, padding_factor=padding_factor)
    return d
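# Usage sketch for build_dictionary above. The enclosing class name and the
# corpus/output paths are illustrative assumptions, not taken from this source:
#
#   d = SomeBertTask.build_dictionary(["train.txt", "valid.txt"], workers=4)
#   d.save("dict.txt")  # fairseq-style dictionaries serialize as "symbol count" lines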
@classmethod
def from_config(cls, config: Config, **kwargs):
    tokenizer = create_component(ComponentType.TOKENIZER, config.tokenizer)
    # Map the configured special tokens onto the canonical vocabulary markers.
    replacements = {
        config.unk_token: UNK,
        config.pad_token: PAD,
        config.bos_token: BOS,
        config.eos_token: EOS,
        config.mask_token: MASK,
    }
    if isinstance(tokenizer, WordPieceTokenizer):
        # WordPiece tokenizers carry their own vocab; reuse it directly.
        vocab = Vocabulary(
            [token for token, _ in tokenizer.vocab.items()],
            replacements=replacements,
        )
    else:
        # Otherwise fall back to a fairseq-style dictionary file.
        dictionary = BertDictionary.load(config.vocab_file)
        vocab = Vocabulary(
            dictionary.symbols, dictionary.count, replacements=replacements
        )
    return cls(
        columns=config.columns,
        tokenizer=tokenizer,
        add_bos_token=config.add_bos_token,
        add_eos_token=config.add_eos_token,
        use_eos_token_for_bos=config.use_eos_token_for_bos,
        max_seq_len=config.max_seq_len,
        vocab=vocab,
        **kwargs,
    )
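# Usage sketch for from_config above, assuming a pytext-style tensorizer class
# (here called BertTensorizer) whose inner Config exposes the fields read in the
# factory; the class name and field values are illustrative assumptions:
#
#   config = BertTensorizer.Config(
#       columns=["text"],
#       vocab_file="dict.txt",  # consulted only when the tokenizer is not WordPiece
#       max_seq_len=256,
#   )
#   tensorizer = BertTensorizer.from_config(config)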
@classmethod
def setup_task(cls, args, **kwargs):
    """Setup the task."""
    # args.data may list several data directories separated by ':'.
    paths = args.data.split(':')
    assert len(paths) > 0
    # The shared BERT dictionary is expected in the first data directory.
    dictionary = BertDictionary.load(os.path.join(paths[0], 'dict.txt'))
    print('| dictionary: {} types'.format(len(dictionary)))
    return cls(args, dictionary)
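# Usage sketch for setup_task above, mirroring how fairseq builds a task from
# parsed arguments. The task class name and data path are illustrative
# assumptions:
#
#   args = argparse.Namespace(data="/path/to/data-bin")  # directory containing dict.txt
#   task = SomeBertTask.setup_task(args)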
@classmethod
def load_dictionary(cls, filename):
    """Load a BertDictionary from a plain-text dictionary file."""
    return BertDictionary.load(filename)