def main_run(topicnum, winsize, bigrammin, trigrammin, fn):
    """Run the phrase-extraction and topic-labeling pipeline on one file.

    The four settings are copied into module-level globals, the input path
    is built from ``fn``, and the pipeline stages are then called in order:
    ``extract_phrases``, ``load_phrase``, ``extract_review``,
    ``build_AOLDA_input_version``, ``OLDA_fit``,
    ``generate_labeling_candidates`` and ``topic_labeling``.

    Args:
        topicnum: Stored in the global ``topic_num``; passed to ``OLDA_fit``.
        winsize: Stored in the global ``win_size``; passed to ``OLDA_fit``.
        bigrammin: Stored in the global ``bigram_min``; passed to
            ``extract_phrases``.
        trigrammin: Stored in the global ``trigram_min``; passed to
            ``extract_phrases``.
        fn: File name appended to ``"file_upload/"`` to form the global
            ``app_files`` path.

    Note:
        ``info_num``, ``store_num`` and ``candidate_num`` are only read
        here, so they must already exist at module level before the call.
    """
    global topic_num, win_size, bigram_min, trigram_min
    global info_num, store_num, candidate_num, app_files

    topic_num, win_size = topicnum, winsize
    bigram_min, trigram_min = bigrammin, trigrammin
    print(topic_num, win_size, bigram_min, trigram_min, info_num, store_num, candidate_num)

    app_files = "file_upload/" + fn
    extract_phrases(app_files, bigram_min, trigram_min)
    load_phrase()

    reviews = extract_review(app_files)
    olda_input = build_AOLDA_input_version(reviews)

    # The timer starts only here, so the reported duration excludes phrase
    # extraction, review extraction and input building.
    started = time.time()
    phis = OLDA_fit(olda_input, topic_num, win_size)
    candidates = generate_labeling_candidates(olda_input)
    # NOTE(review): the meaning of 1.0 / 0.75 / 0.0 is defined by
    # topic_labeling, which is outside this view -- confirm before tuning.
    topic_labeling(olda_input, phis, candidates, 1.0, 0.75, 0.0, save=True)
    elapsed = time.time() - started
    print("Totally takes %.2f seconds" % elapsed)
def save_phrase(review_path, bigram_num, trigram):
    """Call ``extract_phrases`` once per entry of the global ``app_files``.

    ``app_files`` is iterated as two-item entries; only the second item of
    each entry is handed to ``extract_phrases``.

    NOTE(review): ``review_path``, ``bigram_num`` and ``trigram`` are
    accepted but never used by this body -- confirm whether they were meant
    to be forwarded.
    """
    for _first, second in app_files:
        extract_phrases(second)
label_sent_fscore))
# NOTE(review): the line above is the tail of a statement whose beginning
# lies outside this view; it is kept untouched.


def sim_w(w1, w2, wv_model):
    """Return the similarity of two words according to ``wv_model``.

    Returns ``0.0`` when either word fails the ``in wv_model`` membership
    test; otherwise returns ``wv_model.similarity(w1, w2)``.

    NOTE(review): ``wv_model`` is presumably a word-vector model exposing
    ``__contains__`` and ``similarity`` -- confirm against the caller.
    """
    if w1 not in wv_model or w2 not in wv_model:
        return 0.0
    return wv_model.similarity(w1, w2)


def meminfo(str):
    """Print ``str`` followed by this process's ``ru_maxrss`` divided by 1000.

    NOTE(review): the parameter name shadows the builtin ``str``; it is
    kept because renaming it would change the keyword interface.
    NOTE(review): the unit of ``ru_maxrss`` is platform-dependent, so the
    unit of the printed figure is too -- confirm for the target platform.
    """
    print(str, resource.getrusage(resource.RUSAGE_SELF).ru_maxrss / 1000)


def save_phrase(review_path, bigram_num, trigram):
    """Call ``extract_phrases`` once per entry of the global ``app_files``.

    Each entry is unpacked into two items; only the second one is passed on.

    NOTE(review): none of the three parameters is used by this body.
    """
    for apk, app in app_files:
        extract_phrases(app)


# Script entry point: runs the pipeline using settings (app_files,
# bigram_min, trigram_min, topic_num, win_size) that must already be
# defined at module level.
if __name__ == '__main__':
    extract_phrases(app_files, bigram_min, trigram_min)
    load_phrase()
    # extract_review is called with no arguments in this revision.
    timed_reviews = extract_review()
    OLDA_input = build_AOLDA_input_version(timed_reviews)
    # Timing starts here, so it covers fitting, candidate generation and
    # labeling only.
    start_t = time.time()
    apk_phis = OLDA_fit(OLDA_input, topic_num, win_size)
    phrases = generate_labeling_candidates(OLDA_input)
    # NOTE(review): the meaning of 1.0 / 0.75 / 0.0 is defined by
    # topic_labeling, which is outside this view.
    topic_labeling(OLDA_input, apk_phis, phrases, 1.0, 0.75, 0.0, save=True)
    print("Totally takes %.2f seconds" % (time.time() - start_t))
))
# NOTE(review): the line above is the tail of a statement whose beginning
# lies outside this view; it is kept untouched.


def sim_w(w1, w2, wv_model):
    """Return the similarity of two words according to ``wv_model``.

    Returns ``0.0`` when either word fails the ``in wv_model`` membership
    test; otherwise returns ``wv_model.similarity(w1, w2)``.

    NOTE(review): ``wv_model`` is presumably a word-vector model exposing
    ``__contains__`` and ``similarity`` -- confirm against the caller.
    """
    if w1 not in wv_model or w2 not in wv_model:
        return 0.0
    return wv_model.similarity(w1, w2)


def meminfo(str):
    """Print ``str`` followed by this process's ``ru_maxrss`` divided by 1000.

    NOTE(review): the parameter name shadows the builtin ``str``; it is
    kept because renaming it would change the keyword interface.
    NOTE(review): the unit of ``ru_maxrss`` is platform-dependent, so the
    unit of the printed figure is too -- confirm for the target platform.
    """
    print(str, resource.getrusage(resource.RUSAGE_SELF).ru_maxrss / 1000)


def save_phrase(review_path, bigram_num, trigram):
    """Call ``extract_phrases`` once per entry of the global ``app_files``.

    Each entry is unpacked into two items; only the second one is passed
    on, together with the module-level ``language`` as a keyword argument.

    NOTE(review): none of the three parameters is used by this body.
    """
    for apk, app in app_files:
        extract_phrases(app, language=language)


# Script entry point: runs the pipeline using settings (app_files,
# bigram_min, trigram_min, language, topic_num, win_size) that must already
# be defined at module level.
if __name__ == "__main__":
    extract_phrases(app_files, bigram_min, trigram_min, language=language)
    load_phrase()
    # extract_review is called with no arguments in this revision.
    timed_reviews = extract_review()
    OLDA_input = build_AOLDA_input_version(timed_reviews)
    # Timing starts here, so it covers fitting, candidate generation and
    # labeling only.
    start_t = time.time()
    apk_phis = OLDA_fit(OLDA_input, topic_num, win_size)
    phrases = generate_labeling_candidates(OLDA_input)
    # NOTE(review): the meaning of 1.0 / 0.75 / 0.0 is defined by
    # topic_labeling, which is outside this view.
    topic_labeling(OLDA_input, apk_phis, phrases, 1.0, 0.75, 0.0, save=True)
    print("Totally takes %.2f seconds" % (time.time() - start_t))
def save_phrase(review_path, bigram_num, trigram):
    """Pass the module-level ``app_files`` to ``extract_phrases``.

    NOTE(review): ``review_path``, ``bigram_num`` and ``trigram`` are
    accepted but never used by this body -- confirm whether they were meant
    to be forwarded.
    """
    extract_phrases(app_files)