def remove_ads_onnid_core(nid): from ads_remove import AdsExtract if len(nid) == 0: return pname, content_list = AdsExtract.get_para_on_nid(nid) #如果新闻不属于需要检查的源则返回 print len(AdsExtract.ads_dict) if pname.decode('utf-8') not in dict(AdsExtract.ads_dict).keys(): print 'not checked' return ret = AdsExtract.get_ads_paras(pname.decode('utf-8'), content_list) if len(ret) > 0: print 'begin to remove ' + nid AdsExtract.remove_ads(ret, nid)
def get(self): nid = self.get_argument('nid', None) pname, content_list = AdsExtract.get_para_on_nid(nid) ret = AdsExtract.get_ads_paras(pname, content_list) t = '' head_ads = '' tail_ads = '' if len(ret) != 0: t += nid.encode('utf-8') + '广告:' for item in ret.items(): if int(item[0].encode('utf-8')) >= 0: head_ads += ' 新闻开头广告: ' + item[1].encode('utf-8') else: tail_ads += ' 新闻结尾广告: ' + item[1].encode('utf-8') else: t = nid.encode('utf-8') + '没有检测到广告' self.render('ads_nid.html', title=str(nid.encode('utf-8')), head=t, head_ads=head_ads, tail_ads=tail_ads)
def get(self): print 'get names' page_num = json.loads(self.get_argument('page', None)) page_size = json.loads(self.get_argument('pageSize', None)) wechat_names_list = AdsExtract.get_checked_name() print len(wechat_names_list) res = {} res['total_num'] = len(wechat_names_list) if len(wechat_names_list) >= (page_num - 1) * page_size: end_num = min(page_num * page_size - 1, len(wechat_names_list) - 1) res['list'] = wechat_names_list[(page_num - 1) * page_size:end_num + 1] self.write(json.dumps(res))
def get(self): AdsExtract.save_ads_modify() #清空保存了修改微信号的set AdsExtract.modify_dict.clear()
def get(self): modify_type = self.get_argument('type') #'add'或者'delete' modify_data = self.get_argument('para') #段落号:段落内容 print 'modify ads' AdsExtract.modify_ads_results(modify_type, modify_data)
def get(self): name = self.get_argument('name', None) content = {} content['name'] = name content['list'] = AdsExtract.get_ads_of_one_wechat(name) self.write(json.dumps(content))
def get(self): print 'extract' dict_wechat = AdsExtract.get_wechat_news() AdsExtract.extract_ads(dict_wechat)
(r"/news_process/GetWechatNames", GetWechatNames), (r"/news_process/ModifyNewsAdsResults", ModifyNewsAdsResults), (r"/news_process/SaveAdsModify", SaveAdsModify), (r"/news_process/GetModifiedWechatNames", GetModifiedWechatNames), (r"/news_process/RemoveAdsOnnidCore", RemoveAdsOnnidCore), ] settings = { "template_path": "wechat-show", "static_path": os.path.join(os.path.dirname(__file__), "wechat-show"), } tornado.web.Application.__init__(self, handlers, **settings) if __name__ == "__main__": port = int(sys.argv[1]) #9996,9997用于向队列中生产; 9998用于消费;9999用于人工干预 if port == 9996 or port == 9997: http_server = tornado.httpserver.HTTPServer(AdsProcessProductApp()) http_server.listen(port) elif port == 9998: #redis_ads.consume_nid() from redis_process import nid_queue nid_queue.consume_nid_ads() elif port == 9999: AdsExtract.read_data() http_server = tornado.httpserver.HTTPServer(ManualHandleApplication()) http_server.listen(port) tornado.ioloop.IOLoop.instance().start()