def test_paragraph2():
    """Extracting from the second fixture with ``min_len=0`` yields nothing.

    Loads ``test_file2`` through ``load_test_file``, runs it through a
    ``ParagraphExtractor`` built with ``min_len=0``, and asserts that the
    extracted result has length zero.
    """
    # NOTE(review): presumably this fixture contains no paragraph content at
    # all, so even a zero minimum length produces no output -- confirm
    # against the fixture file.
    page_source = load_test_file(test_file2)
    extracted = ParagraphExtractor(min_len=0).extract(page_source)
    extracted_length = len(extracted)
    assert extracted_length == 0
def test_paragraph1():
    """Extracting from the first fixture yields more than 200 items of text.

    Loads ``test_file1`` through ``load_test_file``, runs it through a
    ``ParagraphExtractor`` built with its default arguments, and asserts
    that the length of the extracted result exceeds 200.
    """
    # NOTE(review): the result is presumably a string, making 200 a character
    # count -- confirm against ParagraphExtractor.extract.
    page_source = load_test_file(test_file1)
    extracted = ParagraphExtractor().extract(page_source)
    extracted_length = len(extracted)
    assert extracted_length > 200