def test_double_standard_id_field(self):
    """Run the event spider with title and description both flagged as ID fields.

    Three events are saved beforehand: two of them share the title
    ``Event 1`` and two share the description ``Event 1 description``, but
    only the first one carries both values. The ``id_field`` flag is then
    switched off on ``soa_url`` and switched on for ``soa_title`` and
    ``soa_desc``. After the spider run the test expects six events in total
    and exactly two with the description ``Event 1 description``.
    """
    checker_rt = SchedulerRuntime()
    checker_rt.save()

    # (title, description, url) of the events stored before the spider runs.
    # All of them share the same website and checker runtime.
    preexisting_events = (
        (u'Event 1', u'Event 1 description',
         u'http://localhost:8010/static/site_generic/event5.html'),
        (u'Event 2', u'Event 1 description',
         u'http://localhost:8010/static/site_generic/event6.html'),
        (u'Event 1', u'Event 2 description',
         u'http://localhost:8010/static/site_generic/event7.html'),
    )
    for title, description, url in preexisting_events:
        Event(
            title=title,
            event_website=self.event_website,
            description=description,
            url=url,
            checker_runtime=checker_rt,
        ).save()

    # Identify items by title + description instead of by URL.
    self.soa_url.id_field = False
    self.soa_url.save()
    self.soa_title.id_field = True
    self.soa_title.save()
    self.soa_desc.id_field = True
    self.soa_desc.save()

    self.run_event_spider(1)

    # count() asks the database for the number of rows instead of loading
    # every Event just to measure the length of the result list.
    # NOTE(review): the totals imply the spider adds three new events and
    # skips one as a duplicate -- confirm against the site_generic fixture.
    self.assertEqual(Event.objects.count(), 6)
    self.assertEqual(
        Event.objects.filter(description='Event 1 description').count(), 2)
def test_detail_page_url_id_field(self):
    """Run the event spider with an ``Event 1`` already stored under another URL.

    An event titled ``Event 1`` with the URL ``.../event5.html`` is saved
    first. After the spider run the test expects five events in total, two
    of which are titled ``Event 1``.
    """
    checker_rt = SchedulerRuntime()
    checker_rt.save()

    Event(
        title=u'Event 1',
        event_website=self.event_website,
        url=u'http://localhost:8010/static/site_generic/event5.html',
        checker_runtime=checker_rt,
    ).save()

    self.run_event_spider(1)

    # count() lets the database do the counting instead of fetching all rows.
    # NOTE(review): presumably the scraped "Event 1" has a different detail
    # page URL and is therefore stored as a second record -- confirm against
    # the site_generic fixture.
    self.assertEqual(Event.objects.count(), 5)
    self.assertEqual(Event.objects.filter(title='Event 1').count(), 2)
def test_double(self):
    """Run the event spider with an ``Event 1`` already stored under ``event1.html``.

    After the spider run the test expects four events in total and still
    only a single event titled ``Event 1``.
    """
    checker_rt = SchedulerRuntime()
    checker_rt.save()

    Event(
        title=u'Event 1',
        event_website=self.event_website,
        url=u'http://localhost:8010/static/site_generic/event1.html',
        checker_runtime=checker_rt,
    ).save()

    self.run_event_spider(1)

    # count() lets the database do the counting instead of fetching all rows.
    # NOTE(review): presumably the scraped "Event 1" is recognised as the
    # stored one and not saved again -- confirm against the fixture.
    self.assertEqual(Event.objects.count(), 4)
    self.assertEqual(Event.objects.filter(title='Event 1').count(), 1)
def test_standard_update_field_update(self):
    """Check that a spider run overwrites the title of an already stored event.

    An event titled ``Event 1 - Old Title`` is saved under ``event1.html``
    and ``soa_title.attr_type`` is set to ``'T'``. After the spider run the
    same database row must carry the title ``Event 1`` and no event with
    the old title may remain.
    """
    checker_rt = SchedulerRuntime()
    checker_rt.save()

    event = Event(
        title=u'Event 1 - Old Title',
        event_website=self.event_website,
        url=u'http://localhost:8010/static/site_generic/event1.html',
        checker_runtime=checker_rt,
    )
    event.save()

    # NOTE(review): 'T' presumably marks the title as an updatable standard
    # attribute -- confirm against the attr_type choices of the model.
    self.soa_title.attr_type = 'T'
    self.soa_title.save()

    self.run_event_spider(1)

    # Re-read the row by primary key; the in-memory ``event`` still holds
    # the title it was created with.
    event_updated = Event.objects.get(pk=event.id)
    self.assertEqual(event_updated.title, 'Event 1')
    # count() lets the database do the counting instead of fetching rows.
    self.assertEqual(
        Event.objects.filter(title='Event 1 - Old Title').count(), 0)
def test_single_standard_id_field(self):
    """Run the event spider with the title as the only ID field.

    An event titled ``Event 1`` is saved under ``.../event5.html``. The
    ``id_field`` flag is switched off on ``soa_url`` and switched on for
    ``soa_title``. After the spider run the test expects four events in
    total and a single event titled ``Event 1``.
    """
    checker_rt = SchedulerRuntime()
    checker_rt.save()

    Event(
        title='Event 1',
        event_website=self.event_website,
        url='http://localhost:8010/static/site_generic/event5.html',
        checker_runtime=checker_rt,
    ).save()

    # Identify items by title instead of by URL.
    self.soa_url.id_field = False
    self.soa_url.save()
    self.soa_title.id_field = True
    self.soa_title.save()

    self.run_event_spider(1)

    # count() lets the database do the counting instead of fetching all rows.
    self.assertEqual(Event.objects.count(), 4)
    self.assertEqual(Event.objects.filter(title='Event 1').count(), 1)
def setUpScraperJSChecker(self, path):
    """Prepare the scraper checker and a stored event for the JS test site.

    Runs the parent ``setUp`` first, then configures the scraper's checker
    (type ``'X'``, an XPath and a reference URL) and stores ``self.event``
    with a fresh ``SchedulerRuntime`` as its checker runtime.
    ``checker_x_path_result`` is not set by this method.

    Args:
        path: URL prefix that is put directly in front of
            ``site_with_js/event_not_found.html``.
    """
    super(ScraperJSRunTest, self).setUp()

    # Reference URL for the checker and URL of the stored event; both point
    # at the same page below ``path``.
    checker_ref_url = u'%ssite_with_js/event_not_found.html' % path
    event_url = '%ssite_with_js/event_not_found.html' % path

    scraper = self.scraper
    scraper.checker_type = 'X'
    scraper.checker_x_path = u'//div[@class="event_not_found"]/div/text()'
    scraper.checker_ref_url = checker_ref_url
    scraper.save()

    runtime = SchedulerRuntime()
    runtime.save()

    self.event = Event(
        title='Event 1',
        event_website=self.event_website,
        description='Event 1 description',
        url=event_url,
        checker_runtime=runtime,
    )
    self.event.save()
def extraSetUpHTMLChecker(self):
    """Configure an XPath checker on the scraper and store a matching event.

    The checker gets type ``'X'``, an XPath, the expected XPath result
    ``Event not found!`` and a reference URL. ``self.event`` is stored with
    a fresh ``SchedulerRuntime`` and points at the same
    ``event_not_found.html`` page as the reference URL.
    """
    scraper = self.scraper
    scraper.checker_type = 'X'
    scraper.checker_x_path = u'//div[@class="event_not_found"]/div/text()'
    scraper.checker_x_path_result = u'Event not found!'
    scraper.checker_ref_url = u'http://localhost:8010/static/site_with_json_content_type/event_not_found.html'
    scraper.save()

    runtime = SchedulerRuntime()
    runtime.save()

    event_fields = {
        'title': 'Event 1',
        'event_website': self.event_website,
        'description': 'Event 1 description',
        'url': 'http://localhost:8010/static/site_with_json_content_type/event_not_found.html',
        'checker_runtime': runtime,
    }
    self.event = Event(**event_fields)
    self.event.save()
def extraSetUpJSONChecker(self):
    """Configure a checker for JSON detail pages and store a matching event.

    Sets the scraper's ``detail_page_content_type`` to ``'J'`` and the
    checker to type ``'X'`` with the path ``event_not_found``, the expected
    result ``Event not found!`` and a reference URL. ``self.event`` is
    stored with a fresh ``SchedulerRuntime`` and points at the same
    ``event_not_found.json`` document as the reference URL.
    """
    # Apply the settings in a fixed order, then persist them in one save.
    scraper_settings = (
        ('detail_page_content_type', 'J'),
        ('checker_type', 'X'),
        ('checker_x_path', u'event_not_found'),
        ('checker_x_path_result', u'Event not found!'),
        ('checker_ref_url',
         u'http://localhost:8010/static/site_with_json_content_type/event_not_found.json'),
    )
    for attr_name, value in scraper_settings:
        setattr(self.scraper, attr_name, value)
    self.scraper.save()

    runtime = SchedulerRuntime()
    runtime.save()

    event_url = 'http://localhost:8010/static/site_with_json_content_type/event_not_found.json'
    self.event = Event(
        title='Event 1',
        event_website=self.event_website,
        description='Event 1 description',
        url=event_url,
        checker_runtime=runtime,
    )
    self.event.save()
def setUp(self):
    """Prepare the scraper checker and one stored event for the checker tests.

    Runs the parent ``setUp`` first. The checker gets type ``'X'``, an
    XPath, the expected XPath result ``Event was deleted!`` and the
    reference URL ``.../site_for_checker/event_not_found.html``.
    ``self.event`` is stored with a fresh ``SchedulerRuntime`` and points at
    ``.../site_for_checker/event1.html``, which is not the reference URL.
    """
    super(CheckerRunTest, self).setUp()

    checker = self.scraper
    checker.checker_type = 'X'
    checker.checker_x_path = u'//div[@class="event_not_found"]/div/text()'
    checker.checker_x_path_result = u'Event was deleted!'
    checker.checker_ref_url = u'http://localhost:8010/static/site_for_checker/event_not_found.html'
    checker.save()

    runtime = SchedulerRuntime()
    runtime.save()

    event_fields = dict(
        title='Event 1',
        event_website=self.event_website,
        description='Event 1 description',
        url='http://localhost:8010/static/site_for_checker/event1.html',
        checker_runtime=runtime,
    )
    self.event = Event(**event_fields)
    self.event.save()