def test_get_page_text_with_text(self):
    # A root element with its own text plus a child with text: the test
    # expects both strings back, root text first.
    # NOTE(review): another definition with this exact name is visible in
    # this file; if both sit in the same class the later one replaces this
    # one and this test never runs -- confirm.
    root = ET.fromstring('<head>text<sub>subtext</sub></head>')
    extracted = list(utils.get_page_text(SimulatedPage(root)))
    expected = ['text', 'subtext']
    self.assertEqual(extracted, expected)
def test_get_page_text_with_text(self):
    # Build an empty simulated page, then attach a parsed document whose
    # root and child both carry text; both strings are expected back, root
    # text first.
    # NOTE(review): another definition with this exact name is visible in
    # this file; if both sit in the same class only the later one is kept --
    # confirm which variant is intended.
    page = SimulatedPage()
    page.document = ET.fromstring('<head>text<sub>subtext</sub></head>')
    extracted = list(utils.get_page_text(page))
    expected = ['text', 'subtext']
    self.assertEqual(extracted, expected)
def test_get_page_text_no_text(self):
    # Neither the root nor its child carries any text, so the test expects
    # nothing to be produced.
    # NOTE(review): another definition with this exact name is visible in
    # this file; if both sit in the same class the later one replaces this
    # one and this test never runs -- confirm.
    root = ET.fromstring('<head><sub></sub></head>')
    extracted = list(utils.get_page_text(SimulatedPage(root)))
    expected = []
    self.assertEqual(extracted, expected)
def test_get_page_text_no_text(self):
    # Build an empty simulated page, then attach a parsed document with no
    # text in the root or its child; nothing is expected back.
    # NOTE(review): another definition with this exact name is visible in
    # this file; if both sit in the same class only the later one is kept --
    # confirm which variant is intended.
    page = SimulatedPage()
    page.document = ET.fromstring('<head><sub></sub></head>')
    extracted = list(utils.get_page_text(page))
    expected = []
    self.assertEqual(extracted, expected)