def main(unused):
    """Entry point: parse CLI options, build the vocabulary, and run.

    Args:
        unused: Ignored; present for compatibility with app-runner entry
            points (e.g. tf.app.run style) that pass argv to main.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument("embedding_path")
    parser.add_argument("vocabulary_dir")
    parser.add_argument("--training_dir")
    parser.add_argument("--validation_dir")
    parser.add_argument("--decode_dir")
    parser.add_argument("--decode_out_dir")
    parser.add_argument("--mode", choices=["train", "validate", "decode"],
                        default="train")
    parser.add_argument("--logdir")
    parser.add_argument("--batch_size", type=int, default=30)
    parser.add_argument("--validation_interval", type=int, default=20000)
    parser.add_argument("--beam_width", type=int, default=5)
    parser.add_argument("--max_output_length", type=int, default=32)
    parser.add_argument("--target_vocabulary_size", type=int, default=20000)
    parser.add_argument("--synthetic", action="store_true")
    parser.add_argument("--allow_gpu_growth", action="store_true")
    parser.add_argument("--collect_run_metadata", action="store_true")
    parser.add_argument("--log_weight_images", action="store_true")
    options = parser.parse_args()

    if options.mode == "decode":
        # Batching not supported in decoding
        options.batch_size = 1

    embedding_words, word_dict, word_embedding_dim = load_word_embeddings(
        options.embedding_path)

    # Cap on words taken from the document vocabulary file, and on extra
    # words pulled in from the pretrained embedding vocabulary.
    max_document_vocabulary_words = 150000
    max_embedding_vocabulary_words = 100000

    vocabulary = Vocabulary()
    summary_vocabulary_path = path.join(options.vocabulary_dir,
                                        "summary_vocabulary.txt")
    # Fill up to target_vocabulary_size from the summary vocabulary first.
    vocabulary.add_from_file(
        summary_vocabulary_path,
        options.target_vocabulary_size - len(vocabulary.words))
    document_vocabulary_path = path.join(options.vocabulary_dir,
                                         "document_vocabulary.txt")
    # Add the most common words from vocabulary
    vocabulary.add_from_file(document_vocabulary_path,
                             max_document_vocabulary_words)
    # Add additional common words from loaded embeddings
    # note that embedding_words contains 2D numpy arrays
    vocabulary.add_words(embedding_words[:max_embedding_vocabulary_words])

    run(options, word_dict, word_embedding_dim, vocabulary)
def _make_parser():
    """Return the argparse parser holding every command-line option."""
    parser = argparse.ArgumentParser()
    parser.add_argument('embedding_path')
    parser.add_argument('vocabulary_dir')
    parser.add_argument('--training_dir')
    parser.add_argument('--validation_dir')
    parser.add_argument('--decode_dir')
    parser.add_argument('--decode_out_dir')
    parser.add_argument('--mode', choices=['train', 'validate', 'decode'],
                        default='train')
    parser.add_argument('--logdir')
    parser.add_argument('--batch_size', type=int, default=30)
    parser.add_argument('--validation_interval', type=int, default=20000)
    parser.add_argument('--beam_width', type=int, default=5)
    parser.add_argument('--max_output_length', type=int, default=32)
    parser.add_argument('--target_vocabulary_size', type=int, default=20000)
    parser.add_argument('--synthetic', action='store_true')
    parser.add_argument('--allow_gpu_growth', action='store_true')
    parser.add_argument('--collect_run_metadata', action='store_true')
    parser.add_argument('--log_weight_images', action='store_true')
    return parser


def main(unused):
    """Parse command-line options, assemble the vocabulary, and start a run.

    Args:
        unused: Ignored; kept so app-runner entry points can pass argv.
    """
    options = _make_parser().parse_args()

    if options.mode == 'decode':
        # Batching not supported in decoding
        options.batch_size = 1

    embedding_words, word_dict, word_embedding_dim = load_word_embeddings(
        options.embedding_path)

    vocabulary = Vocabulary()
    # Fill up to target_vocabulary_size from the summary vocabulary first.
    vocabulary.add_from_file(
        path.join(options.vocabulary_dir, 'summary_vocabulary.txt'),
        options.target_vocabulary_size - len(vocabulary.words))
    # Add the most common words from vocabulary
    vocabulary.add_from_file(
        path.join(options.vocabulary_dir, 'document_vocabulary.txt'),
        150000)
    # Add additional common words from loaded embeddings
    vocabulary.add_words(embedding_words[:100000])

    run(options, word_dict, word_embedding_dim, vocabulary)