Esempi in Python per Vocab.add_word

Linguaggio di programmazione: Python

Spazio dei nomi/nome del pacchetto: utils.vocab

Classe/tipologia: Vocab

Metodo/funzione: add_word

Esempi su hotexamples.com: 5

Vocab.add_word in Python: 5 esempi trovati. Questi sono i migliori esempi reali in Python di utils.vocab.Vocab.add_word, estratti da progetti open source. Puoi valutarli per aiutarci a migliorare la qualità dei nostri esempi.

Metodi utilizzati di frequente

Mostra Nascondi

Vocab(30)

load(22)

add(10)

from_file(8)

save(7)

add_word(5)

add_tokenized_sentence(3)

tokens2ids(3)

size(3)

tokens2indices(3)

finish(3)

set_freeze(2)

extend(2)

token2id(2)

process(2)

load_pretrained_emb(2)

__dict__(2)

get_freeze(2)

__get_index__(2)

__get_word__(2)

__len__(2)

build_vocab(2)

encode_sequence_batch(1)

build(1)

unmap(1)

top_words(1)

add_documents(1)

add_pad_token(1)

sequence_2_id(1)

add_unk_token(1)

randomly_init_embeddings(1)

add_words(1)

load_vocab(1)

load_from_pickle(1)

embeddings(1)

load_from_file(1)

load_embeddings(1)

inst2idx(1)

init_embed(1)

get_token(1)

get_size(1)

get_index(1)

contains(1)

from_iterable(1)

convert_tokens_to_ids(1)

create(1)

filter_tokens_by_cnt(1)

word_2_id(1)

Esempio n. 1

Mostra file

File: preprocessors.py Progetto: hiroki13/span-based-srl

    def make_vocab_label(self,
                         sents,
                         vocab_label_init=None):
        """Build a label vocabulary from the BIO labels found in ``sents``.

        Args:
            sents: Sized iterable of sentence objects. Only sentences whose
                ``has_prds`` attribute is truthy contribute; their
                ``prd_bio_labels`` is iterated as a sequence of label
                sequences.
            vocab_label_init: Optional existing vocabulary. When truthy, a
                deep copy of it is extended; otherwise a fresh ``Vocab``
                seeded with the label ``'O'`` is used.

        Returns:
            ``None`` when ``sents`` is empty, otherwise the vocabulary with
            every distinct label added in ``Counter.most_common()`` order.
        """
        if len(sents) == 0:
            return None

        if vocab_label_init:
            # Work on a copy so the caller's vocabulary is left untouched.
            vocab_label = deepcopy(vocab_label_init)
        else:
            vocab_label = Vocab()
            vocab_label.add_word('O')

        # Flatten every label of every proposition into one list.
        flat_labels = [
            label
            for sent in sents
            if sent.has_prds
            for prop in sent.prd_bio_labels
            for label in prop
        ]

        # Add labels from most to least frequent; the counts are not needed.
        for label, _ in Counter(flat_labels).most_common():
            vocab_label.add_word(label)

        return vocab_label

Esempio n. 2

Mostra file

File: preprocessors.py Progetto: hiroki13/span-based-srl

    def make_vocab_label(self,
                         sents,
                         vocab_label_init=None):
        """Build a vocabulary of role labels with their BIO prefix removed.

        Args:
            sents: Sized iterable of sentence objects whose
                ``prd_bio_labels`` is iterated as a sequence of label
                sequences.
            vocab_label_init: Optional existing vocabulary. When truthy, a
                deep copy of it is extended; otherwise a fresh ``Vocab`` is
                seeded with six core labels chosen by
                ``self.argv.data_type``.

        Returns:
            ``None`` when ``sents`` is empty, otherwise the vocabulary. Labels
            are visited in ``Counter.most_common()`` order; labels ending in
            ``'-V'`` or of length <= 1 are skipped, and for the rest the
            first two characters are dropped before adding.
        """
        if len(sents) == 0:
            return None

        if vocab_label_init:
            # Work on a copy so the caller's vocabulary is left untouched.
            vocab_label = deepcopy(vocab_label_init)
        else:
            vocab_label = Vocab()
            core_labels = (
                ["A0", "A1", "A2", "A3", "A4", "A5"]
                if self.argv.data_type == 'conll05'
                else ["ARG0", "ARG1", "ARG2", "ARG3", "ARG4", "ARG5"]
            )
            for core in core_labels:
                vocab_label.add_word(core)

        # Flatten every BIO label of every proposition into one list.
        flat_labels = [
            label
            for sent in sents
            for props in sent.prd_bio_labels
            for label in props
        ]

        for label, _ in Counter(flat_labels).most_common():
            if label.endswith('-V') or len(label) <= 1:
                continue
            # label[2:] drops the two leading characters of the label.
            vocab_label.add_word(label[2:])

        return vocab_label

Esempio n. 3

Mostra file

# Percentage of the counted words reported as missing from GloVe
# (missing_words is computed earlier in the script).
missing_ratio = round((1.0 * missing_words / len(word_counts)) * 100, 4)

print('Number of words missing from GloVe:', missing_words)
print('Percent of words that are missing from vocabulary: {}%'.format(
    missing_ratio))

# Limit the vocab that we will use to words that appear >= threshold or are in GloVe
vocab = Vocab()

# Minimum count a word needs in order to be kept when it is not in GloVe
threshold = 10

for word, count in word_counts.items():
    if count >= threshold or word in glove_embeddings:
        vocab.add_word(word)

# Special tokens that will be added to our vocab
codes = ["<UNK>", "<EOS>", "<GO>", "<PAD>"]

# Add codes to vocab
for code in codes:
    vocab.add_word(code)

# Percentage of the counted words that ended up in the vocab. len(vocab) is
# read after the special tokens were added, so they are part of the numerator.
# The previous expression added 4 to the *fraction* before scaling, which
# inflated the result by 400 percentage points; it also multiplied by 100
# after rounding, which reintroduces float noise. Scale first, then round,
# exactly like missing_ratio above.
usage_ratio = round((1.0 * len(vocab) / len(word_counts)) * 100, 4)

print("Total number of unique words:", len(word_counts))
print("Number of words we will use:", len(vocab))
print("Percent of words we will use: {}%".format(usage_ratio))

# save vocabulary

Esempio n. 4

Mostra file

File: preprocessors.py Progetto: hiroki13/span-based-srl

 def make_vocab_word(word_list):
     """Return a new ``Vocab`` holding ``UNK`` followed by ``word_list``.

     ``UNK`` is added first, then every item of ``word_list`` in iteration
     order, each through ``Vocab.add_word``.
     """
     vocab = Vocab()
     register = vocab.add_word
     register(UNK)
     for token in word_list:
         register(token)
     return vocab

Esempio n. 5

Mostra file

File: misc.py Progetto: angelotran05/span-based-srl

def make_vocab_from_ids(key_value_format):
    """Return a new ``Vocab`` containing the keys of ``key_value_format``.

    Args:
        key_value_format: Iterable of two-item pairs. Only the first item of
            each pair is added (via ``Vocab.add_word``); the second item is
            ignored.
    """
    vocab = Vocab()
    for pair in key_value_format:
        # Unpacking enforces the two-item shape, as the original loop did.
        key, _ = pair
        vocab.add_word(key)
    return vocab