def test__process_html_good_asset(self):
    """Check asset processing when every static file is reported present.

    The crawler's ``_does_static_file_exist`` is replaced with a mock that
    always returns ``True``. Every element of the fixture HTML carrying a
    ``src`` attribute is then handed to ``_process_html_asset`` with ``"/"``
    as the second argument (presumably the page the asset was found on --
    confirm against ``Crawler``).

    Expected outcome: two existence checks were made, and the sitemap
    holds three nodes joined by two edges.
    """
    crawler = Crawler("http://test.com")
    exists_stub = mock.Mock(return_value=True)
    crawler._does_static_file_exist = exists_stub

    parsed = BeautifulSoup(self.html_test_string)
    # ``True`` matches any tag name; ``src=True`` keeps only tags that
    # actually have a ``src`` attribute.
    for tag in parsed.find_all(True, src=True):
        crawler._process_html_asset(tag, "/")

    self.assertEqual(exists_stub.call_count, 2)
    sitemap = crawler.sitemap
    self.assertEqual(len(sitemap.nodes()), 3)
    self.assertEqual(len(sitemap.edges()), 2)
def test__process_html(self):
    """Check that ``_process_html`` dispatches to the asset and link handlers.

    Both ``_process_html_asset`` and ``_process_html_link`` are swapped for
    mocks so that only the dispatching done by ``_process_html`` is
    exercised. For the fixture HTML the asset handler must be invoked
    three times and the link handler four times.
    """
    crawler = Crawler("http://test.com")
    asset_handler = mock.Mock()
    link_handler = mock.Mock()
    crawler._process_html_asset = asset_handler
    crawler._process_html_link = link_handler

    crawler._process_html(BeautifulSoup(self.html_test_string))

    self.assertEqual(asset_handler.call_count, 3)
    self.assertEqual(link_handler.call_count, 4)