Example #1
0
    def __init__(self, config=None, debug=False):
        """Initialise field tables, configuration values and helper objects.

        Args:
            config: Passed unchanged to ``ConfigReader.read``.
            debug: Stored on ``self.debug`` and forwarded to ``DBConnector``.
        """
        # NOTE(review): 'descriprion' looks like a misspelling of
        # 'description'; confirm against the code that consumes this list
        # before changing it.
        self.req_fields = ['title', 'descriprion', 'link']

        # Presumably the optional feed-level fields (per the attribute name);
        # every entry starts out as an empty string.
        self.opt_for_feed = {
            'language': "",
            'subtitle': "",
            'updated': "",
            'updated_parsed': "",
        }

        # Presumably the optional per-item fields (per the attribute name).
        # 'term' maps to a nested dict instead of an empty string --
        # presumably a field/sub-field lookup; verify against the consumer.
        self.opt_for_items = {
            'published': "",
            'published_parsed': "",
            'language': "",
            'term': {
                'field': 'tags',
                'sub_field': 'term',
            },
            'summary': "",
        }
        self.debug = debug

        # Pull the configuration parameters out of the reader.
        reader = ConfigReader()
        reader.read(config)
        self.rss_urls = reader.url_names
        self.freq = reader.freq

        # Fields that must end up without HTML tags; the set starts empty and
        # is handed to the helper method right after.
        self.text_extr_fields = set()
        self.__set_text_extract_fields__()

        # Reset the HTML cutter before exposing it on the instance.
        html_cutter = CutHTML()
        html_cutter.reset()
        self.cut_html = html_cutter

        # Database connector, created with the same debug setting.
        self.db_connector = DBConnector(debug=self.debug)

        # News agent name and time mark start out unset.
        self.news_agent_name = ""
        # Original note here reads "+ 0000" -- presumably a UTC offset for the
        # time mark; confirm.
        self.time_mark = None
	def __init__(self, config=None, debug=False):
		"""Initialise field tables, configuration values and helper objects.

		Args:
			config: Passed unchanged to ``ConfigReader.read``.
			debug: Stored on ``self.debug`` and forwarded to ``DBConnector``.
		"""
		# NOTE(review): 'descriprion' looks like a misspelling of
		# 'description'; confirm against the code that consumes this list
		# before changing it.
		self.req_fields = ['title', 'descriprion', 'link']

		# Presumably the optional feed-level fields (per the attribute name);
		# every entry starts out as an empty string.
		self.opt_for_feed = {
			'language': "",
			'subtitle': "",
			'updated': "",
			'updated_parsed': "",
		}

		# Presumably the optional per-item fields (per the attribute name).
		# 'term' maps to a nested dict instead of an empty string --
		# presumably a field/sub-field lookup; verify against the consumer.
		self.opt_for_items = {
			'published': "",
			'published_parsed': "",
			'language': "",
			'term': {
				'field': 'tags',
				'sub_field': 'term',
			},
			'summary': "",
		}
		self.debug = debug

		# Pull the configuration parameters out of the reader.
		reader = ConfigReader()
		reader.read(config)
		self.rss_urls = reader.url_names
		self.freq = reader.freq

		# Fields that must end up without HTML tags; the set starts empty and
		# is handed to the helper method right after.
		self.text_extr_fields = set()
		self.__set_text_extract_fields__()

		# Reset the HTML cutter before exposing it on the instance.
		html_cutter = CutHTML()
		html_cutter.reset()
		self.cut_html = html_cutter

		# Database connector, created with the same debug setting.
		self.db_connector = DBConnector(debug=self.debug)

		# News agent name and time mark start out unset.
		self.news_agent_name = ""
		# Original note here reads "+ 0000" -- presumably a UTC offset for the
		# time mark; confirm.
		self.time_mark = None