def test_dont_extract_these_results(self):
    """
    The 'no_results.html' sample must yield zero extracted results.

    duckduckgo suggests using google or bing if it doesn't return any
    results - those suggestion urls mustn't be mistaken for actual
    search results.
    """
    sample_path = join(SAMPLE_DIR, 'no_results.html')

    # Read the whole fixture first; the handle is closed before parsing.
    with open(sample_path, 'r') as sample_file:
        markup = sample_file.read()

    document = lxml.html.fromstring(markup)
    extracted = duckduckgo.extract_results(document)

    self.assertEqual(0, len(extracted))
def test_extract_results(self):
    """
    The 'results_test.html' sample must yield exactly 26 extracted results.
    """
    sample_path = join(SAMPLE_DIR, 'results_test.html')

    # Read the whole fixture first; the handle is closed before parsing.
    with open(sample_path, 'r') as sample_file:
        markup = sample_file.read()

    document = lxml.html.fromstring(markup)
    extracted = duckduckgo.extract_results(document)

    self.assertEqual(26, len(extracted))