Ejemplo n.º 1
0
    def __init__(self):
        """Set up the configuration with this project's defaults.

        Runs ``Config.__init__`` first, then overrides a number of attributes
        on the instance and adds the source list, the output directory and
        two numeric limits.
        """
        Config.__init__(self)

        # Overrides applied after the base initialiser has run.
        # NOTE(review): the meaning of each option is defined by ``Config``,
        # which is not visible here -- confirm against its documentation.
        self.memoize_articles = False
        self.fetch_images = False
        self.request_timeout = 60  # presumably seconds -- TODO confirm
        self.number_threads = 20
        self.keep_article_html = True
        self.MIN_WORD_COUNT = 20
        self.verbose = True

        # Sources grouped by category name. Each entry is one comma-separated
        # string with four fields; judging by the placeholders they look like
        # "url,kind,link_regex,tags", where the third field may be empty.
        # NOTE(review): the parser for these strings is outside this block --
        # verify the field order against it.
        self.urls = {
            'category1': [
                'a_url,articles,a_regex_for_links,a_tags',
                'b_url,article,,b.tags',
                'c_url,feed,,c.tags',
            ],
        }

        # Relative path "content<sep>category" using the platform separator.
        self.outputDir = os.path.join('content', 'category')
        self.max_number = 2000
        self.max_days = 100