def build_dictionary(cls, filenames, workers=1, threshold=-1, nwords=-1, padding_factor=8):
    """Build the dictionary from a list of text files.

    Args:
        filenames (list): list of filenames
        workers (int): number of concurrent workers
        threshold (int): defines the minimum word count
        nwords (int): defines the total number of words in the final
            dictionary, including special symbols
        padding_factor (int): can be used to pad the dictionary size to be a
            multiple of 8, which is important on some hardware
            (e.g., Nvidia Tensor Cores).

    Returns:
        AsrDictionary: the finalized dictionary.
    """
    dictionary = AsrDictionary()
    for fname in filenames:
        AsrDictionary.add_file_to_dictionary(
            fname, dictionary, tokenizer.tokenize_line, workers
        )
    dictionary.finalize(
        threshold=threshold, nwords=nwords, padding_factor=padding_factor
    )
    return dictionary
def make_dictionary():
    """Construct a character dictionary covering a-z plus "<space>".

    Returns:
        AsrDictionary: finalized dictionary with ``space_index`` set to the
        index of "<space>" (or -1 if absent).
    """
    dictionary = AsrDictionary()
    for ch in string.ascii_lowercase:
        dictionary.add_symbol(ch)
    dictionary.add_symbol("<space>")
    # padding_factor=1 keeps the dictionary size exact (no extra padding symbols)
    dictionary.finalize(padding_factor=1)
    dictionary.space_index = dictionary.indices.get("<space>", -1)
    return dictionary
def make_dictionary(vocab, non_lang_syms=None):
    """Construct a dictionary from a vocabulary list.

    Args:
        vocab (list): vocabulary symbols to add, in order
        non_lang_syms (list, optional): non-linguistic symbols appended after
            the regular vocabulary and the '<space>' symbol. Defaults to no
            extra symbols.

    Returns:
        AsrDictionary: finalized dictionary with ``space_index`` set to the
        index of '<space>' (or -1 if absent).
    """
    # Fix: avoid a mutable default argument ([]), which is evaluated once at
    # definition time and shared across all calls.
    if non_lang_syms is None:
        non_lang_syms = []
    assert isinstance(vocab, list) and isinstance(non_lang_syms, list)
    d = AsrDictionary()
    for token in vocab:
        d.add_symbol(token)
    d.add_symbol('<space>')
    for token in non_lang_syms:
        d.add_symbol(token)
    d.finalize(padding_factor=1)  # don't add extra padding symbols
    d.space_index = d.indices.get('<space>', -1)
    return d
def make_dictionary(vocab, non_lang_syms=None):
    """Construct a dictionary from a vocabulary list, with BPE configured.

    Args:
        vocab (list): vocabulary symbols to add, in order
        non_lang_syms (list, optional): non-linguistic symbols appended after
            the regular vocabulary and the "<space>" symbol; also stored on
            the dictionary as ``non_lang_syms``. Defaults to no extra symbols.

    Returns:
        AsrDictionary: finalized dictionary with a "characters_asr" BPE built
        and ``space_index`` set to the index of "<space>" (or -1 if absent).
    """
    # Fix: avoid a mutable default argument ([]), which is evaluated once at
    # definition time and shared across all calls.
    if non_lang_syms is None:
        non_lang_syms = []
    assert isinstance(vocab, list) and isinstance(non_lang_syms, list)
    d = AsrDictionary()
    d.non_lang_syms = non_lang_syms
    args = Namespace(bpe="characters_asr")
    d.build_bpe(args)
    for token in vocab:
        d.add_symbol(token)
    d.add_symbol("<space>")
    for token in non_lang_syms:
        d.add_symbol(token)
    d.finalize(padding_factor=1)  # don't add extra padding symbols
    d.space_index = d.indices.get("<space>", -1)
    return d