示例#1
0
文件: spider.py 项目: monocleman1/dd
 def _get_allowed_domains(self, spec):
     """Return the domains derived from the URLs referenced by ``spec``.

     URLs are gathered, in order, from every entry of
     ``spec['templates']``, from the entries of ``spec['init_requests']``
     (when that key is present) whose ``'type'`` equals ``'start'``, and
     from ``self._start_urls.allowed_domains``.  The combined list is handed
     to ``iter_unique_scheme_hostname`` and the second element of each
     yielded pair is returned as a list.
     """
     candidates = []
     for template in spec['templates']:
         candidates.append(template['url'])
     for request in spec.get('init_requests', []):
         # Only requests explicitly marked as start requests contribute.
         if request['type'] == 'start':
             candidates.append(request['url'])
     candidates.extend(self._start_urls.allowed_domains)
     # NOTE(review): iter_unique_scheme_hostname is defined outside this
     # block; presumably it yields de-duplicated (scheme, hostname) pairs.
     hostnames = []
     for _scheme, hostname in iter_unique_scheme_hostname(candidates):
         hostnames.append(hostname)
     return hostnames
示例#2
0
 def _get_allowed_domains(self, templates):
     """Return the domains derived from template and start-request URLs.

     The ``'url'`` item of every entry in ``templates`` is collected first,
     followed by the ``url`` attribute of every object in
     ``self._start_requests``.  The combined list is passed to
     ``iter_unique_scheme_hostname`` and element ``[1]`` of each yielded
     item is returned as a list.
     """
     template_urls = [template['url'] for template in templates]
     request_urls = [request.url for request in self._start_requests]
     combined = template_urls + request_urls
     # NOTE(review): element [1] is presumably the hostname of a
     # (scheme, hostname) pair -- confirm against the helper's definition.
     return [entry[1] for entry in iter_unique_scheme_hostname(combined)]
示例#3
0
文件: spider.py 项目: widy28/portia
 def _get_allowed_domains(self, templates):
     """Compute the domain list from ``templates`` and the start requests.

     Each template contributes its ``'url'`` item and each object in
     ``self._start_requests`` contributes its ``url`` attribute, in that
     order.  The resulting URLs are fed to ``iter_unique_scheme_hostname``;
     the value at index 1 of every yielded item makes up the returned list.
     """
     sources = []
     for template in templates:
         sources.append(template['url'])
     for start_request in self._start_requests:
         sources.append(start_request.url)

     # NOTE(review): index 1 is presumably the hostname half of each
     # (scheme, hostname) item produced by the helper -- verify.
     hostnames = []
     for pair in iter_unique_scheme_hostname(sources):
         hostnames.append(pair[1])
     return hostnames
示例#4
0
 def _get_allowed_domains(self, templates):
     """Return the domains derived from template URLs and ``start_urls``.

     The ``url`` attribute of every template is collected and then extended
     with the contents of ``self.start_urls``.  The combined list is passed
     to ``iter_unique_scheme_hostname`` and element ``[1]`` of each yielded
     item is returned as a list.
     """
     combined = [template.url for template in templates]
     # extend() mirrors the in-place ``+=`` and accepts any iterable.
     combined.extend(self.start_urls)
     # NOTE(review): the helper presumably yields (scheme, hostname) items;
     # only the second element is kept -- confirm.
     unique_pairs = iter_unique_scheme_hostname(combined)
     return [pair[1] for pair in unique_pairs]
示例#5
0
 def _get_allowed_domains(self, templates):
     """Compute the domain list from ``templates`` and ``self.start_urls``.

     Template ``url`` attributes come first, followed by every entry of
     ``self.start_urls``.  The URLs are handed to
     ``iter_unique_scheme_hostname`` and the value at index 1 of each
     yielded item is collected into the returned list.
     """
     collected = []
     for template in templates:
         collected.append(template.url)
     collected.extend(self.start_urls)

     # NOTE(review): index 1 is presumably the hostname of each item the
     # helper yields -- verify against its definition.
     result = []
     for item in iter_unique_scheme_hostname(collected):
         result.append(item[1])
     return result
示例#6
0
 def _get_allowed_domains(self, spec):
     """Return the domains derived from the URLs referenced by ``spec``.

     Three sources are combined in order: the ``'url'`` of every entry in
     ``spec['templates']``; the ``'url'`` of every entry in
     ``spec['init_requests']`` (if present) whose ``'type'`` is
     ``'start'``; and ``self._start_urls.allowed_domains``.  The combined
     list is passed to ``iter_unique_scheme_hostname`` and the second
     element of each yielded pair is returned as a list.
     """
     template_urls = [tpl['url'] for tpl in spec['templates']]
     start_request_urls = [
         req['url']
         for req in spec.get('init_requests', [])
         if req['type'] == 'start'
     ]
     all_urls = template_urls + start_request_urls
     all_urls.extend(self._start_urls.allowed_domains)

     # NOTE(review): iter_unique_scheme_hostname lives outside this block;
     # presumably it yields de-duplicated (scheme, hostname) pairs.
     domains = []
     for _scheme, domain in iter_unique_scheme_hostname(all_urls):
         domains.append(domain)
     return domains