예제 #1
0
def export_vocab(tweets, vocab_size, export=True):
    """Build a vocabulary from *tweets* and optionally save it to disk.

    Args:
        tweets: Iterable whose items are themselves iterables of words
            (presumably tokenized tweets -- confirm against the caller).
        vocab_size: Passed straight through to ``Word2Vec.vocab_to_num``.
        export: When true, the vocabulary is written to
            ``./data/vocab.npy`` with ``np.save``.

    Returns:
        Whatever ``Word2Vec.vocab_to_num`` produces for the flattened words.
    """
    # Flatten every tweet into a single list of words, preserving order.
    flat_words = [word for tweet in tweets for word in tweet]
    mapping = Word2Vec.vocab_to_num(flat_words, vocab_size)
    if not export:
        return mapping
    np.save('./data/vocab.npy', mapping)
    return mapping
def export_vocab(comments, categories, vocab_size, export=True):
    """Build a vocabulary from comment and category text, optionally saving it.

    Args:
        comments: Mapping whose values are iterables of word sequences;
            every word of every sequence is collected.
        categories: Mapping with the same value layout as *comments*; its
            words are collected after those of *comments*.
        vocab_size: Passed straight through to ``Word2Vec.vocab_to_num``.
        export: When true, the vocabulary is dumped as indented JSON to
            ``../resources/vocab.json``.

    Returns:
        Whatever ``Word2Vec.vocab_to_num`` produces for the collected words.
    """
    collected = []
    # Comments first, then categories, so the word order fed to the
    # vocabulary builder stays the same.
    for source in (comments, categories):
        for name in source:
            collected.extend(itertools.chain.from_iterable(source[name]))
    mapping = Word2Vec.vocab_to_num(collected, vocab_size)
    if not export:
        return mapping
    with open("../resources/vocab.json", "w") as out_file:
        json.dump(mapping, out_file, indent=2)
    return mapping