def test_cue_3():
    """Check which five sentences the cue method selects, and in what order.

    The document is built from three groups of sentences, the second of
    which is empty.
    """
    leading_sentences = (
        "ba "*10,
        "bb "*10,
        " sa"*8 + " bb"*10,
        "bb bc ba",
    )
    no_sentences = ()
    trailing_sentences = (
        "babbbc "*10,
        "na nb nc nd sa" + " bc"*10,
        " ba n"*10,
    )
    document = build_document(leading_sentences, no_sentences, trailing_sentences)

    cue_summarizer = EdmundsonSummarizer()
    cue_summarizer.bonus_words = ("ba", "bb", "bc",)
    cue_summarizer.stigma_words = ("sa", "sb", "sc",)

    expected = [
        ("ba "*10).strip(),
        ("bb "*10).strip(),
        "bb bc ba",
        "na nb nc nd sa bc bc bc bc bc bc bc bc bc bc",
        ("ba n "*10).strip(),
    ]

    summary = cue_summarizer.cue_method(document, 5)
    assert [to_unicode(sentence) for sentence in summary] == expected
def test_cue_empty():
    """The cue method yields no sentences for a document built with no arguments."""
    cue_summarizer = EdmundsonSummarizer()
    cue_summarizer.bonus_words = ("ba", "bb", "bc",)
    cue_summarizer.stigma_words = ("sa", "sb", "sc",)

    summary = cue_summarizer.cue_method(build_document(), 10)

    assert [to_unicode(sentence) for sentence in summary] == []
def test_cue_1():
    """A single-sentence document produces exactly one sentence from the cue method."""
    only_sentence = "ba bb bc bb unknown ľščťžýáíé sb sc sb"
    document = build_document((only_sentence,))

    cue_summarizer = EdmundsonSummarizer()
    cue_summarizer.bonus_words = ("ba", "bb", "bc",)
    cue_summarizer.stigma_words = ("sa", "sb", "sc",)

    summary = cue_summarizer.cue_method(document, 10)
    assert len(summary) == 1
def test_cue_2():
    """Check the cue method on a two-sentence document with limits of 10 and 1."""
    cue_sentence = "ba bb bc bb unknown ľščťžýáíé sb sc sb"
    plain_sentence = "Pepek likes spinach"
    document = build_document((cue_sentence,), (plain_sentence,))

    cue_summarizer = EdmundsonSummarizer()
    cue_summarizer.bonus_words = ("ba", "bb", "bc",)
    cue_summarizer.stigma_words = ("sa", "sb", "sc",)

    # A limit larger than the document returns both sentences.
    full_summary = cue_summarizer.cue_method(document, 10)
    assert [to_unicode(sentence) for sentence in full_summary] == [
        cue_sentence,
        plain_sentence,
    ]

    # With a limit of one, only the first sentence is expected.
    short_summary = cue_summarizer.cue_method(document, 1)
    assert [to_unicode(sentence) for sentence in short_summary] == [
        cue_sentence,
    ]
def test_cue_letters_case():
    """Check the cue method when sentence words differ in case from the bonus words.

    With bonus words "X" and "w", the expected selection is the longer
    sentence of each group, even though its letter case does not match the
    bonus word.
    """
    x_sentences = ("X X X", "x x x x",)
    w_sentences = ("w w w", "W W W W",)
    document = build_document(x_sentences, w_sentences)

    cue_summarizer = EdmundsonSummarizer()
    cue_summarizer.bonus_words = ("X", "w",)
    cue_summarizer.stigma_words = ("stigma",)

    summary = cue_summarizer.cue_method(document, 2)
    expected = [
        "x x x x",
        "W W W W",
    ]
    assert [to_unicode(sentence) for sentence in summary] == expected
def test_cue_with_no_bonus_words():
    """Calling the cue method with only stigma words set must raise ValueError."""
    cue_summarizer = EdmundsonSummarizer()
    cue_summarizer.stigma_words = ("useless", "bad", "spinach",)

    # The document is built inside the context so the guarded code is unchanged.
    with pytest.raises(ValueError):
        cue_summarizer.cue_method(build_document(), 10)
def test_cue_with_no_stigma_words():
    """Calling the cue method with only bonus words set must raise ValueError."""
    cue_summarizer = EdmundsonSummarizer()
    cue_summarizer.bonus_words = ("great", "very", "beautiful",)

    # The document is built inside the context so the guarded code is unchanged.
    with pytest.raises(ValueError):
        cue_summarizer.cue_method(build_document(), 10)
def test_cue_with_no_words():
    """Calling the cue method with neither bonus nor stigma words set must raise ValueError."""
    cue_summarizer = EdmundsonSummarizer()

    # The document is built inside the context so the guarded code is unchanged.
    with pytest.raises(ValueError):
        cue_summarizer.cue_method(build_document(), 10)