def __init__(self, url, cached=True):
    """Set up the page wrapper and, when a URL is given, load and parse it.

    The ``images``, ``links`` and ``texts`` attributes always start out as
    ``None``. When ``url`` is truthy it is stripped of surrounding
    whitespace and stored on ``self.url``, ``self.loadPage(cached)`` is
    called, and a new ``HtmlParser`` is fed the text read through
    ``path(self.page).text()``.

    Args:
        url: Address of the page to parse. A falsy value (``None`` or an
            empty string) skips loading and parsing entirely.
        cached: Forwarded unchanged to ``self.loadPage``; its exact meaning
            is defined there.
    """
    # Pass the URL as a lazy logging argument instead of concatenating it:
    # "'parsing:' + None" raises TypeError before the guard below is ever
    # reached, while the emitted message for a string URL stays the same.
    logging.debug('parsing:%s', url)

    self.images = None
    self.links = None
    self.texts = None

    # NOTE(review): for a falsy URL the attributes ``url`` and ``parser`` are
    # never assigned by this method; callers must not rely on them then.
    if url:
        self.url = url.strip()
        # presumably loadPage() populates self.page, which is read just
        # below -- confirm against its definition.
        self.loadPage(cached)
        self.parser = HtmlParser()
        self.parser.set_html(path(self.page).text())