Example #1
0
def main_run(topicnum, winsize, bigrammin, trigrammin, fn):
    """Store the run settings in module globals and run the pipeline on one file.

    The four numeric arguments are copied into the module-level names
    ``topic_num``, ``win_size``, ``bigram_min`` and ``trigram_min``. ``fn`` is
    appended to ``"file_upload/"`` and the result is stored in the global
    ``app_files``. ``info_num``, ``store_num`` and ``candidate_num`` are only
    read here (for the diagnostic print), so they must already exist at
    module level.

    Args:
        topicnum: Stored in ``topic_num`` and passed to ``OLDA_fit``.
        winsize: Stored in ``win_size`` and passed to ``OLDA_fit``.
        bigrammin: Stored in ``bigram_min`` and passed to ``extract_phrases``.
        trigrammin: Stored in ``trigram_min`` and passed to ``extract_phrases``.
        fn: String appended to ``"file_upload/"`` to form the input path.
    """
    global topic_num, win_size, bigram_min, trigram_min
    global info_num, store_num, candidate_num, app_files

    topic_num, win_size = topicnum, winsize
    bigram_min, trigram_min = bigrammin, trigrammin
    print(topic_num, win_size, bigram_min, trigram_min,
          info_num, store_num, candidate_num)

    app_files = "file_upload/" + fn
    extract_phrases(app_files, bigram_min, trigram_min)
    load_phrase()

    reviews = extract_review(app_files)
    olda_input = build_AOLDA_input_version(reviews)

    # The timer covers fitting, candidate generation and labeling only;
    # phrase extraction and review loading above are not included.
    started_at = time.time()
    fitted_phis = OLDA_fit(olda_input, topic_num, win_size)
    label_candidates = generate_labeling_candidates(olda_input)
    topic_labeling(olda_input, fitted_phis, label_candidates,
                   1.0, 0.75, 0.0, save=True)
    elapsed = time.time() - started_at
    print("Totally takes %.2f seconds" % elapsed)
Example #2
0
def save_phrase(review_path, bigram_num, trigram):
    """Call ``extract_phrases`` on the second item of every ``app_files`` pair.

    ``app_files`` is read from module scope and must yield two-item entries.
    NOTE(review): ``review_path``, ``bigram_num`` and ``trigram`` are accepted
    but never used by this function - confirm whether that is intended.
    """
    for entry in app_files:
        # Only the second element is used; the first is unpacked and ignored.
        _apk, app_item = entry
        extract_phrases(app_item)
Example #3
0
                    label_sent_fscore))


def sim_w(w1, w2, wv_model):
    """Return ``wv_model.similarity(w1, w2)``, or ``0.0`` if a word is missing.

    Args:
        w1: First word; must support ``w1 in wv_model``.
        w2: Second word; only checked when ``w1`` is present.
        wv_model: Object supporting ``in`` and a ``similarity(a, b)`` method
            (presumably a word-vector model - confirm against the caller).

    Returns:
        The model's similarity value when both words are known, else ``0.0``.
    """
    both_known = w1 in wv_model and w2 in wv_model
    if both_known:
        return wv_model.similarity(w1, w2)
    return 0.0


def meminfo(str):
    """Print a label followed by this process's ``ru_maxrss`` divided by 1000.

    Args:
        str: Label printed before the number. The name shadows the builtin
            ``str`` but is kept so existing keyword callers keep working.

    NOTE(review): the unit of ``ru_maxrss`` is platform-dependent, so the
    printed figure is only comparable on the same platform.
    """
    usage = resource.getrusage(resource.RUSAGE_SELF)
    peak_scaled = usage.ru_maxrss / 1000
    print(str, peak_scaled)


def save_phrase(review_path, bigram_num, trigram):
    """Call ``extract_phrases`` on the second item of every ``app_files`` pair.

    ``app_files`` is read from module scope and must yield two-item entries.
    NOTE(review): ``review_path``, ``bigram_num`` and ``trigram`` are accepted
    but never used by this function - confirm whether that is intended.
    """
    for entry in app_files:
        # Only the second element is used; the first is unpacked and ignored.
        _apk, app_item = entry
        extract_phrases(app_item)


# Script entry point: runs the whole pipeline using module-level settings
# (app_files, bigram_min, trigram_min, topic_num, win_size) defined elsewhere.
if __name__ == '__main__':
    # Phrase extraction runs first, then load_phrase(); presumably the latter
    # consumes what the former produced - TODO confirm.
    extract_phrases(app_files, bigram_min, trigram_min)
    load_phrase()

    timed_reviews = extract_review()

    OLDA_input = build_AOLDA_input_version(timed_reviews)
    # Timing starts here, so it covers fitting, candidate generation and
    # labeling but not phrase extraction or review loading.
    start_t = time.time()
    apk_phis = OLDA_fit(OLDA_input, topic_num, win_size)
    phrases = generate_labeling_candidates(OLDA_input)
    # The three floats are positional arguments whose meaning is defined by
    # topic_labeling (not visible here).
    topic_labeling(OLDA_input, apk_phis, phrases, 1.0, 0.75, 0.0, save=True)
    print("Totally takes %.2f seconds" % (time.time() - start_t))
Example #4
0
        ))


def sim_w(w1, w2, wv_model):
    """Return ``wv_model.similarity(w1, w2)``, or ``0.0`` if a word is missing.

    Args:
        w1: First word; must support ``w1 in wv_model``.
        w2: Second word; only checked when ``w1`` is present.
        wv_model: Object supporting ``in`` and a ``similarity(a, b)`` method
            (presumably a word-vector model - confirm against the caller).

    Returns:
        The model's similarity value when both words are known, else ``0.0``.
    """
    both_known = w1 in wv_model and w2 in wv_model
    if both_known:
        return wv_model.similarity(w1, w2)
    return 0.0


def meminfo(str):
    """Print a label followed by this process's ``ru_maxrss`` divided by 1000.

    Args:
        str: Label printed before the number. The name shadows the builtin
            ``str`` but is kept so existing keyword callers keep working.

    NOTE(review): the unit of ``ru_maxrss`` is platform-dependent, so the
    printed figure is only comparable on the same platform.
    """
    usage = resource.getrusage(resource.RUSAGE_SELF)
    peak_scaled = usage.ru_maxrss / 1000
    print(str, peak_scaled)


def save_phrase(review_path, bigram_num, trigram):
    """Call ``extract_phrases`` on the second item of every ``app_files`` pair.

    ``app_files`` and ``language`` are read from module scope; ``app_files``
    must yield two-item entries, and ``language`` is forwarded as a keyword.
    NOTE(review): ``review_path``, ``bigram_num`` and ``trigram`` are accepted
    but never used by this function - confirm whether that is intended.
    """
    for entry in app_files:
        # Only the second element is used; the first is unpacked and ignored.
        _apk, app_item = entry
        extract_phrases(app_item, language=language)


# Script entry point: runs the whole pipeline using module-level settings
# (app_files, bigram_min, trigram_min, language, topic_num, win_size) defined
# elsewhere.
if __name__ == "__main__":
    # Phrase extraction runs first, then load_phrase(); presumably the latter
    # consumes what the former produced - TODO confirm.
    extract_phrases(app_files, bigram_min, trigram_min, language=language)
    load_phrase()

    timed_reviews = extract_review()

    OLDA_input = build_AOLDA_input_version(timed_reviews)
    # Timing starts here, so it covers fitting, candidate generation and
    # labeling but not phrase extraction or review loading.
    start_t = time.time()
    apk_phis = OLDA_fit(OLDA_input, topic_num, win_size)
    phrases = generate_labeling_candidates(OLDA_input)
    # The three floats are positional arguments whose meaning is defined by
    # topic_labeling (not visible here).
    topic_labeling(OLDA_input, apk_phis, phrases, 1.0, 0.75, 0.0, save=True)
    print("Totally takes %.2f seconds" % (time.time() - start_t))
Example #5
0
def save_phrase(review_path, bigram_num, trigram):
    # Calls extract_phrases on the module-level app_files value.
    # NOTE(review): review_path, bigram_num and trigram are not used in the
    # visible part of this function - confirm whether that is intended.
    extract_phrases(app_files)