Exemples Python de Vocab.pickle

Langage de programmation: Python

Espace de noms/Paquet : utils

Class/Type: Vocab

Méthode/Fonction: pickle

Exemples sur hotexamples.com : 3

Python Vocab.pickle - 3 exemples trouvés. Ce sont les exemples réels les mieux notés de utils.Vocab.pickle extraits de projets open source. Vous pouvez noter les exemples pour nous aider à en améliorer la qualité.

Méthodes fréquemment utilisées

Afficher / Cacher

encode(30)

construct(30)

load(15)

Vocab(9)

add_word(6)

to_input_tensor(4)

get_word_list(3)

pickle(3)

decode(3)

get_train_dev_test(3)

get_pre_trained_examples(2)

build_vocab(2)

add_dataframe(2)

save_to_file(2)

add(2)

add_special_token(2)

update(2)

build_bert_vocab(2)

build(2)

add_words(2)

add_special_tokens(2)

build_embedding_matrix(2)

word2id(1)

get_wv(1)

id2word(1)

indices2tokens(1)

transform(1)

_looking_up(1)

load_pretrained_char_embeddings(1)

load_pretrained_word_embeddings(1)

py_size(1)

randomly_init_py_embeddings(1)

size(1)

add_char(1)

filter_pys_by_cnt(1)

get_vocab(1)

construct_phrase(1)

add_list(1)

add_py(1)

build_from_counter(1)

char_size(1)

check_words(1)

construct_batch(1)

convert_to_str(1)

getIndex(1)

decode_docs(1)

emb_wordtoindex(1)

__len__(1)

filter_chars_by_cnt(1)

filter_tokens_by_cnt(1)

Méthodes fréquemment utilisées

encode (30)

construct (30)

load (15)

Vocab (9)

add_word (6)

to_input_tensor (4)

get_word_list (3)

pickle (3)

decode (3)

get_train_dev_test (3)

Méthodes fréquemment utilisées

get_pre_trained_examples (2)

build_vocab (2)

add_dataframe (2)

save_to_file (2)

add (2)

add_special_token (2)

update (2)

build_bert_vocab (2)

build (2)

add_words (2)

add_special_tokens (2)

build_embedding_matrix (2)

word2id (1)

get_wv (1)

id2word (1)

indices2tokens (1)

transform (1)

_looking_up (1)

load_pretrained_char_embeddings (1)

load_pretrained_word_embeddings (1)

Méthodes fréquemment utilisées

add_special_tokens (2)

build_embedding_matrix (2)

word2id (1)

get_wv (1)

id2word (1)

indices2tokens (1)

transform (1)

_looking_up (1)

load_pretrained_char_embeddings (1)

load_pretrained_word_embeddings (1)

py_size (1)

randomly_init_py_embeddings (1)

size (1)

add_char (1)

filter_pys_by_cnt (1)

get_vocab (1)

construct_phrase (1)

add_list (1)

add_py (1)

build_from_counter (1)

char_size (1)

check_words (1)

construct_batch (1)

convert_to_str (1)

getIndex (1)

decode_docs (1)

emb_wordtoindex (1)

__len__ (1)

filter_chars_by_cnt (1)

filter_tokens_by_cnt (1)

Méthodes fréquemment utilisées

py_size (1)

randomly_init_py_embeddings (1)

size (1)

add_char (1)

filter_pys_by_cnt (1)

get_vocab (1)

construct_phrase (1)

add_list (1)

add_py (1)

build_from_counter (1)

char_size (1)

check_words (1)

construct_batch (1)

convert_to_str (1)

getIndex (1)

decode_docs (1)

emb_wordtoindex (1)

__len__ (1)

filter_chars_by_cnt (1)

filter_tokens_by_cnt (1)

fit (1)

from_corpus (1)

word_size (1)

Exemple #1

0

Afficher le fichier

Fichier : prepare_data.py Projet : xuandif-cmu/dialogue-hred-vhred

('test', test)]: print(f'Processing {split_type} dataset...') split_data_dir = datasets_dir.joinpath(split_type) split_data_dir.mkdir(exist_ok=True) conversation_length = [ min(len(conv), max_conv_len) for conv in conversations ] sentences, sentence_length = pad_sentences( conversations, max_sentence_length=max_sent_len, max_conversation_length=max_conv_len) print('Saving preprocessed data at', split_data_dir) to_pickle(conversation_length, split_data_dir.joinpath('conversation_length.pkl')) to_pickle(sentences, split_data_dir.joinpath('sentences.pkl')) to_pickle(sentence_length, split_data_dir.joinpath('sentence_length.pkl')) if split_type != 'test': print('Save Vocabulary...') vocab.add_dataframe(conversations) vocab.update(max_size=max_vocab_size, min_freq=min_freq) print('Vocabulary size: ', len(vocab)) vocab.pickle(datasets_dir.joinpath('word2id.pkl'), datasets_dir.joinpath('id2word.pkl')) print('Done!')

Exemple #2

0

Afficher le fichier

sentences, sentence_length = pad_sentences( conversations, max_sentence_length=max_sent_len, max_conversation_length=max_conv_len) print('Saving preprocessed data at', split_data_dir) to_pickle(conversation_length, split_data_dir.joinpath('conversation_length.pkl')) to_pickle(sentences, split_data_dir.joinpath('sentences.pkl')) to_pickle(sentence_length, split_data_dir.joinpath('sentence_length.pkl')) to_pickle(emotions, split_data_dir.joinpath('labels.pkl')) if split_type == 'train': print('Save Vocabulary...') vocab = Vocab(tokenizer) vocab.add_dataframe(conversations) assert(GLOVE_DIR != "") vocab.update(GLOVE_DIR, max_size=max_vocab_size, min_freq=min_freq) print('Vocabulary size: ', len(vocab)) vocab.pickle(dailydialog_dir.joinpath('word2id.pkl'), dailydialog_dir.joinpath('id2word.pkl'), dailydialog_dir.joinpath('word_emb.pkl')) print('Done!')

Exemple #3

0

Afficher le fichier

sentences, sentence_length = pad_sentences( conv_sentences, max_sentence_length=max_sent_len, max_conversation_length=max_conv_len) for sentence_len, label in zip(conversation_length, conv_labels): assert(sentence_len ==len(label)) print('Saving preprocessed data at', split_data_dir) to_pickle(conversation_length, split_data_dir.joinpath( 'conversation_length.pkl')) to_pickle(sentences, split_data_dir.joinpath('sentences.pkl')) to_pickle(conv_labels, split_data_dir.joinpath('labels.pkl')) to_pickle(sentence_length, split_data_dir.joinpath( 'sentence_length.pkl')) to_pickle(iemocap.vids[split_type], split_data_dir.joinpath('video_id.pkl')) if split_type == 'train': print('Save Vocabulary...') vocab = Vocab(tokenizer) vocab.add_dataframe(conv_sentences) assert(GLOVE_DIR != "") vocab.update(GLOVE_DIR, max_size=max_vocab_size, min_freq=min_freq) print('Vocabulary size: ', len(vocab)) vocab.pickle(iemocap_dir.joinpath('word2id.pkl'), iemocap_dir.joinpath('id2word.pkl'), iemocap_dir.joinpath('word_emb.pkl'))