示例#1
0
 def test_spidername_time(self):
     formatted = _format("Spider: $spider:name. Item scraped at $time",
                         self.spider, self.response, self.item, {})
     self.assertRegexpMatches(
         formatted,
         'Spider: myspider. Item scraped at \d{4}-\d{2}-\d{2} \d{2}:\d{2}:\d{2}$'
     )
示例#2
0
 def test_response(self):
     formatted = _format("$response:url", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, self.response.url)
示例#3
0
 def test_invalidattr(self):
     formatted = _format("Argument arg2: $spider:arg2", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, "Argument arg2: $spider:arg2")
示例#4
0
 def test_noargs(self):
     """If entity does not accept arguments, don't substitute"""
     formatted = _format("Scraped on day $unixtime:arg", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, "Scraped on day $unixtime:arg")
示例#5
0
 def test_settings(self):
     formatted = _format("$setting:MY_SETTING", self.spider, self.response, self.item, {"$setting": {"MY_SETTING": True}})
     self.assertEqual(formatted, 'True')
示例#6
0
 def test_spiderarg(self):
     formatted = _format("Argument arg1: $spider:arg1", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, 'Argument arg1: val1')
示例#7
0
 def test_isotime(self):
     formatted = _format("$isotime", self.spider, self.response, self.item, {})
     self.assertRegexpMatches(formatted, '\d{4}-\d{2}-\d{2}T\d{2}:\d{2}:\d{2}\.\d{6}$')
示例#8
0
 def test_spidername_time(self):
     formatted = _format("Spider: $spider:name. Item scraped at $time", self.spider, self.response, self.item, {})
     self.assertRegexpMatches(formatted, 'Spider: myspider. Item scraped at \d{4}-\d{2}-\d{2} \d{2}:\d{2}:\d{2}$')
示例#9
0
 def test_spiderattr(self):
     formatted = _format("$spider:start_urls", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, "['http://example.com']")
示例#10
0
 def test_spiderarg(self):
     formatted = _format("Argument arg1: $spider:arg1", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, 'Argument arg1: val1')
示例#11
0
 def test_jobid(self):
     os.environ["SCRAPY_JOB"] = 'aa788'
     formatted = _format("job id '$jobid' for spider $spider:name", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, "job id 'aa788' for spider myspider")
示例#12
0
 def test_isotime(self):
     formatted = _format("$isotime", self.spider, self.response, self.item, {})
     self.assertRegexpMatches(formatted, '\d{4}-\d{2}-\d{2}T\d{2}:\d{2}:\d{2}\.\d{6}$')
示例#13
0
 def test_unixtime(self):
     formatted = _format("Item scraped at $unixtime", self.spider, self.response, self.item, {})
     self.assertRegexpMatches(formatted, 'Item scraped at \d+\.\d+$')
示例#14
0
 def test_hello(self):
     self.assertEqual(_format("hello world!", self.spider, self.response, self.item, {}), 'hello world!')
示例#15
0
 def test_regex(self):
     formatted = _format("$field:url,r'item_no=(\d+)'", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, '345')
示例#16
0
 def test_fields_copy(self):
     formatted = _format("$field:nom", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, 'myitem')
示例#17
0
 def test_hello(self):
     self.assertEqual(_format("hello world!", self.spider, self.response, self.item, {}), 'hello world!')
示例#18
0
 def test_settings(self):
     formatted = _format("$setting:MY_SETTING", self.spider, self.response, self.item, {"$setting": {"MY_SETTING": True}})
     self.assertEqual(formatted, 'True')
示例#19
0
 def test_unixtime(self):
     formatted = _format("Item scraped at $unixtime", self.spider, self.response, self.item, {})
     self.assertRegexpMatches(formatted, 'Item scraped at \d+\.\d+$')
示例#20
0
 def test_notexisting(self):
     """Not existing entities are not substituted"""
     formatted = _format("Item scraped at $myentity", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, 'Item scraped at $myentity')
示例#21
0
 def test_jobid(self):
     os.environ["SCRAPY_JOB"] = 'aa788'
     formatted = _format("job id '$jobid' for spider $spider:name", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, "job id 'aa788' for spider myspider")
示例#22
0
 def test_noargs(self):
     """If entity does not accept arguments, don't substitute"""
     formatted = _format("Scraped on day $unixtime:arg", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, "Scraped on day $unixtime:arg")
示例#23
0
 def test_spiderattr(self):
     formatted = _format("$spider:start_urls", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, "['http://example.com']")
示例#24
0
 def test_noargs2(self):
     """If entity does not have enough arguments, don't substitute"""
     formatted = _format("$spider", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, "$spider")
示例#25
0
 def test_notexisting(self):
     """Not existing entities are not substituted"""
     formatted = _format("Item scraped at $myentity", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, 'Item scraped at $myentity')
示例#26
0
 def test_invalidattr(self):
     formatted = _format("Argument arg2: $spider:arg2", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, "Argument arg2: $spider:arg2")
示例#27
0
 def test_noargs2(self):
     """If entity does not have enough arguments, don't substitute"""
     formatted = _format("$spider", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, "$spider")
示例#28
0
 def test_environment(self):
     os.environ["TEST_ENV"] = "testval"
     formatted = _format("$env:TEST_ENV", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, "testval")
示例#29
0
 def test_environment(self):
     os.environ["TEST_ENV"] = "testval"
     formatted = _format("$env:TEST_ENV", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, "testval")
示例#30
0
 def test_response(self):
     formatted = _format("$response:url", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, self.response.url)
示例#31
0
 def test_fields_copy(self):
     formatted = _format("$field:nom", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, 'myitem')
示例#32
0
 def test_regex(self):
     formatted = _format("$field:url,r'item_no=(\d+)'", self.spider, self.response, self.item, {})
     self.assertEqual(formatted, '345')