Пример #1
0
class TestCrawlTask(unittest.TestCase):
    """Unit tests for ``CrawlTask``.

    Covers the initial property values, the pickle round-trip and the
    behaviour of the visit/change counters.
    """

    def setUp(self):
        """Build a fresh task from a fixed site id and URL for every test."""
        self._url = URL('ftp://deltha.uh.cu/')
        self._site_id = 'aa958756e769188be9f76fbdb291fe1b2ddd4777'
        self._task = CrawlTask(self._site_id, self._url)

    def test_properties(self):
        """A new task exposes its constructor arguments and initial counters."""
        self.assertEqual(self._task.site_id, self._site_id)
        # URLs are compared through their string form.
        self.assertEqual(str(self._task.url), str(self._url))
        self.assertEqual(self._task.revisit_wait, 0)
        # No visit has been reported yet, so the expected count is -1.
        self.assertEqual(self._task.revisit_count, -1)
        self.assertEqual(self._task.change_count, 0)

    def test_pickling(self):
        """A pickle round-trip yields a task with the same property values."""
        task = pickle.loads(pickle.dumps(self._task))
        self.assertEqual(self._task.site_id, task.site_id)
        self.assertEqual(str(self._task.url), str(task.url))
        self.assertEqual(self._task.revisit_wait, task.revisit_wait)
        self.assertEqual(self._task.revisit_count, task.revisit_count)
        self.assertEqual(self._task.change_count, task.change_count)

    def test_revisit_wait(self):
        """A value assigned to ``revisit_wait`` after visits is read back."""
        self._task.report_visit(True)
        self._task.report_visit(False)
        self._task.revisit_wait = 60
        self.assertEqual(self._task.revisit_wait, 60)

    def test_reset_counters(self):
        """``reset_change_count()`` is expected to zero only ``change_count``."""
        self._task.report_visit(True)
        self._task.report_visit(True)
        self._task.revisit_wait = 60
        self._task.reset_change_count()
        # The wait and the visit counter are expected to keep their values.
        self.assertEqual(self._task.revisit_wait, 60)
        self.assertEqual(self._task.revisit_count, 1)
        self.assertEqual(self._task.change_count, 0)

    def test_report_visit(self):
        """Check both counters after visits without and with changes.

        The first reported visit is expected not to count as a change, and
        ``revisit_count`` is expected to grow by one per reported visit.
        """
        self._task.report_visit(True)
        # Reporting visit without changes.
        self._task.report_visit(False)
        self._task.report_visit(False)
        self.assertEqual(self._task.revisit_count, 2)
        self.assertEqual(self._task.change_count, 0)
        # Reporting visits with changes.
        self._task.report_visit(True)
        self._task.report_visit(True)
        self.assertEqual(self._task.revisit_count, 4)
        self.assertEqual(self._task.change_count, 2)
Пример #2
0
class TestCrawlTask(unittest.TestCase):
    """Unit tests for ``CrawlTask``.

    Covers the initial property values, the pickle round-trip and the
    behaviour of the visit/change counters.
    """

    def setUp(self):
        """Build a fresh task from a fixed site id and URL for every test."""
        self._url = URL('ftp://deltha.uh.cu/')
        self._site_id = 'aa958756e769188be9f76fbdb291fe1b2ddd4777'
        self._task = CrawlTask(self._site_id, self._url)

    def test_properties(self):
        """A new task exposes its constructor arguments and initial counters."""
        self.assertEqual(self._task.site_id, self._site_id)
        # URLs are compared through their string form.
        self.assertEqual(str(self._task.url), str(self._url))
        self.assertEqual(self._task.revisit_wait, 0)
        # No visit has been reported yet, so the expected count is -1.
        self.assertEqual(self._task.revisit_count, -1)
        self.assertEqual(self._task.change_count, 0)

    def test_pickling(self):
        """A pickle round-trip yields a task with the same property values."""
        task = pickle.loads(pickle.dumps(self._task))
        self.assertEqual(self._task.site_id, task.site_id)
        self.assertEqual(str(self._task.url), str(task.url))
        self.assertEqual(self._task.revisit_wait, task.revisit_wait)
        self.assertEqual(self._task.revisit_count, task.revisit_count)
        self.assertEqual(self._task.change_count, task.change_count)

    def test_revisit_wait(self):
        """A value assigned to ``revisit_wait`` after visits is read back."""
        self._task.report_visit(True)
        self._task.report_visit(False)
        self._task.revisit_wait = 60
        self.assertEqual(self._task.revisit_wait, 60)

    def test_reset_counters(self):
        """``reset_change_count()`` is expected to zero only ``change_count``."""
        self._task.report_visit(True)
        self._task.report_visit(True)
        self._task.revisit_wait = 60
        self._task.reset_change_count()
        # The wait and the visit counter are expected to keep their values.
        self.assertEqual(self._task.revisit_wait, 60)
        self.assertEqual(self._task.revisit_count, 1)
        self.assertEqual(self._task.change_count, 0)

    def test_report_visit(self):
        """Check both counters after visits without and with changes.

        The first reported visit is expected not to count as a change, and
        ``revisit_count`` is expected to grow by one per reported visit.
        """
        self._task.report_visit(True)
        # Reporting visit without changes.
        self._task.report_visit(False)
        self._task.report_visit(False)
        self.assertEqual(self._task.revisit_count, 2)
        self.assertEqual(self._task.change_count, 0)
        # Reporting visits with changes.
        self._task.report_visit(True)
        self._task.report_visit(True)
        self.assertEqual(self._task.revisit_count, 4)
        self.assertEqual(self._task.change_count, 2)