def get_sentence_keyword_score(document, num_sentences):
    """Distribute the weight of the leading keywords over the sentences.

    Keywords are extracted from ``document`` with ``Rake.get_keywords`` and
    ordered by ``Rake.generate_keyword_rank``. Only the first quarter
    (rounded up) of that ordered list is used. Each selected keyword adds
    its score, divided by the summed score of all selected keywords, to the
    slot of the sentence named by its ``'sentence_num'`` entry.

    Args:
        document: Text handed to ``Rake.get_keywords``.
        num_sentences: Length of the returned list. Every selected keyword's
            ``'sentence_num'`` must be a valid index into a list of this
            length.

    Returns:
        A list of ``num_sentences`` floats. The list is all zeros when no
        keyword is selected or when the selected scores sum to zero.

    Raises:
        IndexError: If a keyword's ``'sentence_num'`` is outside the range
            of ``num_sentences``.
    """
    rake = Rake()
    keywords = rake.get_keywords(document)
    ranked_keywords = rake.generate_keyword_rank(keywords)

    # Keep the first quarter of the ranked list, rounding up so that a
    # non-empty list always yields at least one keyword.
    # NOTE(review): assumes generate_keyword_rank returns best-first order.
    sufficient_keywords_length = int(math.ceil(len(ranked_keywords) / 4.0))
    sufficient_keywords = ranked_keywords[:sufficient_keywords_length]

    sentence_keyword_score = [0.0] * num_sentences

    total_keyword_score = sum(
        (keyword['score'] for keyword in sufficient_keywords), 0.0
    )
    if not total_keyword_score:
        # Nothing to distribute; also avoids dividing by zero when every
        # selected keyword has a zero score.
        return sentence_keyword_score

    # The value of a keyword is its score relative to the total score of
    # all selected keywords.
    for keyword in sufficient_keywords:
        sentence_keyword_score[keyword['sentence_num']] += (
            keyword['score'] / total_keyword_score
        )

    return sentence_keyword_score
# Usage example: extract keywords from a short Japanese sample text and
# print them.
from rake import Rake

# Extractor instance built with its default constructor arguments.
rake = Rake()

# Sample input: a Japanese-language passage about the Sugiyama Kofun.
text = "杉山古墳(すぎやまこふん)は、奈良県奈良市大安寺にある古墳。形状は前方後円墳。大安寺古墳群を構成する古墳の1つ。国の史跡に指定されている(史跡「大安寺旧境内 附 石橋瓦窯跡」のうち)。"

# NOTE(review): the second argument is presumably the number of keywords to
# return (the recorded output below lists three) -- confirm against the
# rake package's documentation.
print(rake.get_keywords(text, 3))

# Output recorded by the original author. This is a bare string expression,
# so it has no effect when the script runs.
""" Output Keyword List ['ぎやまこふん', '前方後円墳', '大安寺'] """