def test_recursive_filter_on(self): record = URLRecord() record.level = 0 url_filter = RecursiveFilter(enabled=True) self.assertTrue(url_filter.test(None, record)) record.level = 1 self.assertTrue(url_filter.test(None, record))
def test_recursive_filter_off(self): record = URLRecord() record.level = 0 url_filter = RecursiveFilter() self.assertTrue(url_filter.test(None, record)) record.level = 1 self.assertFalse(url_filter.test(None, record))
def test_recursive_filter_requisites(self): record = URLRecord() record.level = 0 record.inline_level = 1 url_filter = RecursiveFilter(page_requisites=True) self.assertTrue(url_filter.test(None, record))
def new_mock_url_record(): url_record = URLRecord() url_record.url = 'http://example.com' url_record.parent_url = 'http://example.com' url_record.level = 0 return url_record
def _new_url_record(cls, request: Request) -> URLRecord: '''Return new empty URLRecord.''' url_record = URLRecord() url_record.url = request.url_info.url url_record.status = Status.in_progress url_record.try_count = 0 url_record.level = 0 return url_record
def test_level_filter(self): record = URLRecord() record.level = 4 url_filter = LevelFilter(0) self.assertTrue(url_filter.test(None, record)) url_filter = LevelFilter(5) record.level = 5 self.assertTrue(url_filter.test(None, record)) record.level = 6 self.assertFalse(url_filter.test(None, record)) url_filter = LevelFilter(5) record.inline_level = 1 record.level = 5 self.assertTrue(url_filter.test(None, record)) record.level = 6 self.assertTrue(url_filter.test(None, record)) record.level = 7 self.assertTrue(url_filter.test(None, record)) record.level = 8 self.assertFalse(url_filter.test(None, record)) url_filter = LevelFilter(0) record.inline_level = 1 self.assertTrue(url_filter.test(None, record)) record.inline_level = 2 self.assertTrue(url_filter.test(None, record)) record.inline_level = 3 self.assertTrue(url_filter.test(None, record)) record.inline_level = 4 self.assertTrue(url_filter.test(None, record)) record.inline_level = 5 self.assertTrue(url_filter.test(None, record)) record.inline_level = 6 self.assertFalse(url_filter.test(None, record)) record.level = 1 url_filter = LevelFilter(0, inline_max_depth=0) record.inline_level = 1000 self.assertTrue(url_filter.test(None, record)) url_filter = LevelFilter(5, inline_max_depth=1) record.inline_level = 1 self.assertTrue(url_filter.test(None, record)) record.inline_level = 2 self.assertFalse(url_filter.test(None, record))
def to_plain(self) -> URLRecord: record = URLRecord() record.url = self.url record.parent_url = self.parent_url record.root_url = self.root_url record.status = Status(self.status) record.try_count = self.try_count record.level = self.level record.inline_level = self.inline_level record.link_type = LinkType(self.link_type) if self.link_type else None record.priority = self.priority record.post_data = self.post_data record.status_code = self.status_code record.filename = self.filename return record
def child_url_record(self, url: str, inline: bool=False, link_type: Optional[LinkType]=None, post_data: Optional[str]=None, level: Optional[int]=None): '''Return a child URLRecord. This function is useful for testing filters before adding to table. ''' url_record = URLRecord() url_record.url = url url_record.status = Status.todo url_record.try_count = 0 url_record.level = self.url_record.level + 1 if level is None else level url_record.root_url = self.url_record.root_url or self.url_record.url url_record.parent_url = self.url_record.url url_record.inline_level = (self.url_record.inline_level or 0) + 1 if inline else 0 url_record.link_type = link_type url_record.post_data = post_data return url_record