Пример #1
0
 def ExtractNews(self, count=10):
     """Extract and store content for up to ``count`` unextracted news items.

     Asks ``NewsWorker.GetUnextractedNews(count)`` for pending items and, for
     each one, downloads the page at ``item.url`` with ``GetData``, decodes it
     as UTF-8, runs ``self.Extract`` with the item's tag name/class/id, and
     saves the resulting HTML and text through ``NewsWorker.AddContent``.

     A failure on one item is logged via ``Setting.error_log.LogException``
     and does not stop the remaining items from being processed.

     Args:
         count: Number of items requested from ``GetUnextractedNews``.

     Returns:
         None.
     """
     worker = NewsWorker()
     for item in worker.GetUnextractedNews(count):
         try:
             url = item.url
             print(url)
             news_id = item.id  # renamed from ``id`` to avoid shadowing the builtin
             tag_name = item.tag_name
             tag_class = item.tag_class
             tag_id = item.tag_id

             # presumably GetData returns the raw page as bytes, since it is
             # decoded here -- verify against GetData's definition
             page = GetData(url)
             text, html = self.Extract(
                 page.decode('utf-8'), tag_name, tag_class, tag_id
             )

             # AddContent receives the HTML first, then the plain text.
             worker.AddContent(news_id, MysqlStr(html), MysqlStr(text))
         except Exception as ex:
             # Best-effort batch: log the failure and move on to the next item.
             Setting.error_log.LogException(ex)
     # NOTE: the previous version had a ``return`` inside the loop body, which
     # ended the method after the first item regardless of ``count``.