def test_duplicate(self):
    # Check that the 'duplicate-page-duplicate.html' regression fixture is
    # flagged as a suspected duplicate of the article stored on
    # ``self._article`` (assigned in setUp).
    duplicate_markup = load_regression_data('duplicate-page-duplicate.html')
    candidate_page = r.fragment_fromstring(duplicate_markup)

    # Reference article first, candidate page second.
    verdict = r.is_suspected_duplicate(self._article, candidate_page)
    self.assertTrue(verdict)
def setUp(self):
    """Parse the reference article fixture and keep it on ``self._article``.

    Calls the parent ``setUp`` first, then loads the
    'duplicate-page-article.html' regression fixture and stores the result
    of ``r.fragment_fromstring`` for the tests in this class to compare
    against.
    """
    super(TestIsSuspectedDuplicate, self).setUp()
    self._article = r.fragment_fromstring(
        load_regression_data('duplicate-page-article.html')
    )