예제 #1
0
def test_paragraph2():
    """Check that extraction from the second fixture yields an empty result.

    The extractor is built with ``min_len=0`` and run on the content
    loaded from ``test_file2``; the extracted value must have length zero.
    """
    page_source = load_test_file(test_file2)
    extracted = ParagraphExtractor(min_len=0).extract(page_source)
    # Keep the explicit len() call so a non-sized result (e.g. None) still errors.
    assert not len(extracted)
예제 #2
0
def test_paragraph1():
    """Check that extraction from the first fixture yields a long result.

    A default-configured extractor is run on the content loaded from
    ``test_file1``; the extracted value must be longer than 200.
    """
    page_source = load_test_file(test_file1)
    extracted = ParagraphExtractor().extract(page_source)
    extracted_length = len(extracted)
    assert extracted_length > 200