def __init__(self, url, count):
    """Store the crawl settings and create the helper objects.

    Args:
        url: Download address; stored unchanged on ``self.url``.
        count: Total number of records to crawl; stored unchanged on
            ``self.count``.
    """
    # Download address.
    self.url = url
    # Total number of records to crawl.
    self.count = count
    # Downloader instance.
    self.downloader = downloader.Downloader()
    # Outputer instance.
    self.outputer = outputer.Outputer()
def __init__(self):
    """Create one instance of each helper and store it on ``self``.

    The helpers are built in this order: URL manager, HTML downloader,
    HTML parser, outputer.
    """
    self.urls = url_manager.UrlManager()
    self.downloader = html_downloader.HtmlDownloader()
    self.parser = html_parser.HtmlParser()
    self.outputer = outputer.Outputer()
def __init__(self, root_url):
    """Remember the root URL and create an outputer.

    Args:
        root_url: Stored unchanged on ``self.root_url``.
    """
    self.root_url = root_url
    self.outputer = outputer.Outputer()
def __init__(self):
    """Create one instance of each helper and store it on ``self``.

    Sets ``urlmanager``, ``htmldownloader``, ``htmlparser`` and
    ``outputer``, in that order.
    """
    self.urlmanager = urlmanager.UrlManager()
    self.htmldownloader = htmldownload.HtmlDownload()
    self.htmlparser = htmlparser.HtmlParser()
    self.outputer = outputer.Outputer()
def __init__(self, url):
    """Create the helper objects and remember the root URL.

    Args:
        url: Passed to ``html_parser.Parser`` and also stored unchanged
            on ``self.root_url``.
    """
    self.urls = url_manager.UrlManager()
    self.downloader = html_downloader.HtmlDownloader()
    # The parser is the only helper that receives the URL.
    self.parser = html_parser.Parser(url)
    self.outputer = outputer.Outputer()
    self.root_url = url
def __init__(self):
    """Create an ``outputer.Outputer`` and store it on ``self.outputer``."""
    self.outputer = outputer.Outputer()
def __init__(self):
    """Create one instance of each helper and store it on ``self``.

    Sets ``url_manager``, ``output`` and ``soup``, in that order.
    """
    self.url_manager = url_manage.UrlManage()
    self.output = outputer.Outputer()
    # Despite its name, ``soup`` holds an ``html_parser.HtmlParser``.
    self.soup = html_parser.HtmlParser()
def __init__(self):
    """Create one instance of each helper and store it on ``self``.

    Two separate parser objects are created: one from ``html_parser``
    and one from ``html_parser_zhaopin``.
    """
    # URL manager.
    self.urls = url_manager.UrlManager()
    # Web page downloader.
    # NOTE(review): the attribute is spelled ``downloder``; it is kept
    # as-is because other code may reference that exact name.
    self.downloder = html_downloader.HtmlDownloader()
    # Parser for 51JOB web pages.
    self.parser = html_parser.HtmlParser()
    # Parser for recruitment (zhaopin) web pages.
    self.html_parser_zhaopin = html_parser_zhaopin.HtmlParser()
    # Result output.
    self.outputer = outputer.Outputer()
def __init__(self):
    """Create one instance of each helper and store it privately.

    All four helpers are kept in underscore-prefixed attributes.
    """
    # URL manager.
    self._url_manager = url_manager.URLManager()
    # HTML downloader.
    self._downloader = html_downloader.HTMLDownloader()
    # HTML parser.
    self._parser = html_parser.HTMLParser()
    # Data collector / outputer.
    self._outputer = outputer.Outputer()
def __init__(self):
    """Create a downloader and an outputer and store them on ``self``."""
    self.downloader = downloader.Downloader()
    self.outputer = outputer.Outputer()