Example #1
0
def get_sentence_keyword_score(document, num_sentences):
    """Distribute normalized keyword scores across a document's sentences.

    Keywords are extracted from ``document`` and ranked with ``Rake``. Only
    the first quarter of the ranked list (rounded up) is kept. Each kept
    keyword adds its share of the kept keywords' total score to the entry
    selected by its ``'sentence_num'`` value.

    Args:
        document: Text passed unchanged to ``Rake.get_keywords``.
        num_sentences: Length of the returned list. Assumed to be larger
            than every keyword's ``'sentence_num'`` -- TODO confirm against
            the caller; a larger index raises ``IndexError``.

    Returns:
        A list of ``num_sentences`` floats. When the kept keywords have a
        non-zero total score the entries sum to 1.0 (up to float rounding);
        otherwise every entry is 0.0.
    """
    rake = Rake()
    ranked_keywords = rake.generate_keyword_rank(rake.get_keywords(document))

    # Keep only the leading quarter of the ranked keywords, rounding up so a
    # non-empty ranking always keeps at least one keyword.
    kept_count = int(math.ceil(len(ranked_keywords) / 4.0))
    kept_keywords = ranked_keywords[:kept_count]

    sentence_keyword_score = [0.0] * num_sentences

    # The float start value keeps the later division a true division.
    total_keyword_score = sum((kw['score'] for kw in kept_keywords), 0.0)
    if not total_keyword_score:
        # No keywords, or all scores are zero: there is nothing to normalize
        # by, so return the zero vector instead of dividing by zero.
        return sentence_keyword_score

    # A keyword's value is its score relative to the total of all kept scores.
    for kw in kept_keywords:
        sentence_keyword_score[kw['sentence_num']] += (
            kw['score'] / total_keyword_score)
    return sentence_keyword_score
Example #2
0
from rake import Rake

# Demo: run keyword extraction on a Japanese sample sentence and print the
# result. The second argument (3) presumably caps the number of keywords
# returned -- the sample output below has three entries.
text = "杉山古墳(すぎやまこふん)は、奈良県奈良市大安寺にある古墳。形状は前方後円墳。大安寺古墳群を構成する古墳の1つ。国の史跡に指定されている(史跡「大安寺旧境内 附 石橋瓦窯跡」のうち)。"
rake = Rake()
top_keywords = rake.get_keywords(text, 3)
print(top_keywords)
# Output keyword list:
#
# ['ぎやまこふん', '前方後円墳', '大安寺']