def __op_rejudge_done(self, data_loaded, connection):
    """Finish a re-judge request and hand the item back to the judge.

    ``data_loaded`` must provide the keys ``'id'`` and ``'decision'``; both
    values are converted with ``int()``. The matching ``UrlItem`` is loaded,
    its id is removed from ``self.__ext_queue``, the item and the decision are
    passed to ``self.__send_back_to_judge`` and finally the string ``"0"`` is
    sent over ``connection``.

    Raises ``KeyError`` if a required key is missing from ``data_loaded`` or
    the id is not present in ``self.__ext_queue``.
    """
    url_id = int(data_loaded['id'])
    verdict = int(data_loaded['decision'])

    url_item = UrlItem.load(id=url_id)

    # The item leaves the extractor queue before it is re-submitted.
    del self.__ext_queue[url_id]
    self.__send_back_to_judge(url_item, verdict)

    # Reply to the caller; "0" is presumably the success code -- confirm
    # against the client side of the protocol.
    tool.send_msg(connection, "0")
def __op_rejudge_done(self, data_loaded, connection):
    """Handle the "rejudge done" operation for one URL item.

    Reads the integer ``'id'`` and ``'decision'`` fields from ``data_loaded``,
    loads the corresponding ``UrlItem``, drops that id from
    ``self.__ext_queue``, forwards the item together with the decision to
    ``self.__send_back_to_judge`` and answers on ``connection`` with ``"0"``.
    """
    # Convert in the same order the fields are consumed: id first, then
    # decision (a generator keeps that left-to-right evaluation order).
    item_key, new_decision = (
        int(data_loaded[field]) for field in ('id', 'decision')
    )

    loaded = UrlItem.load(id=item_key)
    del self.__ext_queue[item_key]

    self.__send_back_to_judge(loaded, new_decision)
    tool.send_msg(connection, "0")
def __refresh_list(self):
    """Re-run the automatic judge over every entry in the judge queue.

    For each ``(key, ent)`` pair in ``self.__judge_queue`` the entry's
    ``'feature'`` is passed to ``self.__auto_judge``, which returns a
    ``(decision, confidence)`` pair.

    * If ``confidence`` exceeds ``config.const_CONFIDENCE_THRESHOLD`` the
      decision is stored in the ``UrlItem`` (``'is_target'``) and saved.
      Target items (multiple or single) are passed to
      ``self.__send_to_extractor``; for any other decision the entry's file
      is removed from ``config.path_judge_inbox``. The key is then dropped
      from the queue.
    * Otherwise the entry stays queued and only its ``'confidence'`` and
      ``'decision'`` fields are refreshed.
    """
    delete_ids = []

    # items() instead of the Python-2-only iteritems(): it behaves the same
    # on Python 2 and also works on Python 3. The outer mapping is never
    # resized inside the loop (removals are deferred), so iterating a live
    # view is safe.
    for key, ent in self.__judge_queue.items():
        decision, confidence = self.__auto_judge(ent['feature'])

        if not confidence > config.const_CONFIDENCE_THRESHOLD:
            # Not confident enough: keep the entry queued, just update the
            # automatic estimate stored with it.
            self.__judge_queue[key]['confidence'] = confidence
            self.__judge_queue[key]['decision'] = decision
            continue

        # Confident enough: persist the decision and dispatch the item.
        item = UrlItem.load(id=key)
        item['is_target'] = decision
        item.save()
        delete_ids.append(key)

        if int(item['is_target']) in [config.const_IS_TARGET_MULTIPLE,
                                      config.const_IS_TARGET_SIGNLE]:
            self.__send_to_extractor(item)
        else:
            os.remove(config.path_judge_inbox + "/%s" % ent['filename'])

    # Deferred removal: deleting during iteration would invalidate the loop.
    for ent_id in delete_ids:
        del self.__judge_queue[ent_id]
def __op_done(self, data_loaded, connection):
    """Apply a judge decision to one queued URL item.

    ``data_loaded`` must provide ``'id'`` and ``'decision'`` (both converted
    with ``int()``). The decision is stored in the item's ``'is_target'``
    field and saved. A target item (multiple or single) is passed to
    ``self.__send_to_extractor``; otherwise its file is removed from
    ``config.path_judge_inbox``. Afterwards the queued feature and the
    decision are handed to ``self.__relearn_clf``, the id is removed from
    ``self.__judge_queue`` and ``"0"`` is sent over ``connection``.

    Raises ``KeyError`` if the id is not present in ``self.__judge_queue``.
    """
    url_id = int(data_loaded['id'])
    verdict = int(data_loaded['decision'])

    url_item = UrlItem.load(id=url_id)
    url_item['is_target'] = verdict
    url_item.save()

    # Read the value back from the item (after saving) before classifying.
    stored_target = int(url_item['is_target'])
    target_kinds = [config.const_IS_TARGET_MULTIPLE,
                    config.const_IS_TARGET_SIGNLE]
    if stored_target not in target_kinds:
        # Not a target: its file in the judge inbox is no longer needed.
        os.remove(config.path_judge_inbox + "/%s" % url_item.filename())
    else:
        self.__send_to_extractor(url_item)

    # Feed the decision back with the feature stored for this item, then
    # drop the item from the judge queue.
    queued_feature = self.__judge_queue[url_id]['feature']
    self.__relearn_clf(queued_feature, verdict)
    del self.__judge_queue[url_id]

    tool.send_msg(connection, "0")
def __op_done(self, data_loaded, connection):
    """Record the decision made for a judged item and dispatch the item.

    Steps, in order:

    1. Parse ``data_loaded['id']`` and ``data_loaded['decision']`` as ints.
    2. Load the ``UrlItem``, store the decision in ``'is_target'``, save it.
    3. Send target items to the extractor; remove the inbox file of any
       other item.
    4. Pass the queued ``'feature'`` and the decision to
       ``self.__relearn_clf`` and delete the id from ``self.__judge_queue``.
    5. Send ``"0"`` over ``connection``.
    """
    key = int(data_loaded['id'])
    chosen = int(data_loaded['decision'])

    record = UrlItem.load(id=key)
    record['is_target'] = chosen
    record.save()

    is_target = int(record['is_target']) in (
        config.const_IS_TARGET_MULTIPLE,
        config.const_IS_TARGET_SIGNLE,
    )
    if is_target:
        # item is target
        self.__send_to_extractor(record)
    else:
        # item is not target
        inbox_file = config.path_judge_inbox + "/%s" % record.filename()
        os.remove(inbox_file)

    self.__relearn_clf(self.__judge_queue[key]['feature'], chosen)
    del self.__judge_queue[key]

    tool.send_msg(connection, "0")
def __refresh_list(self):
    """Auto-judge all queued entries and flush the confident ones.

    Every entry of ``self.__judge_queue`` is scored with
    ``self.__auto_judge(ent['feature'])``, which yields
    ``(decision, confidence)``. Entries whose confidence is above
    ``config.const_CONFIDENCE_THRESHOLD`` are written to their ``UrlItem``
    (``'is_target'``), saved, dispatched and removed from the queue. A target
    decision goes to ``self.__send_to_extractor``; any other decision deletes
    the entry's file from ``config.path_judge_inbox``. All remaining entries
    only get their ``'confidence'`` and ``'decision'`` fields updated.
    """
    delete_ids = []

    # dict.iteritems() does not exist on Python 3; items() works on both
    # major versions. Only the per-entry dicts are modified while looping,
    # never the set of keys, so iterating the mapping directly is safe.
    for key, ent in self.__judge_queue.items():
        decision, confidence = self.__auto_judge(ent['feature'])

        if confidence > config.const_CONFIDENCE_THRESHOLD:
            # pretty sure, save to db, and pass to extract
            item = UrlItem.load(id=key)
            item['is_target'] = decision
            item.save()
            delete_ids.append(key)

            if int(item['is_target']) in [
                config.const_IS_TARGET_MULTIPLE,
                config.const_IS_TARGET_SIGNLE,
            ]:
                self.__send_to_extractor(item)
            else:
                # Not a target: remove its file from the judge inbox.
                os.remove(config.path_judge_inbox + "/%s" % ent['filename'])
        else:
            # Still uncertain: keep it queued with the latest estimate.
            self.__judge_queue[key]['confidence'] = confidence
            self.__judge_queue[key]['decision'] = decision

    # clear delete_ids (done after the loop so the mapping is not resized
    # while it is being iterated)
    for ent_id in delete_ids:
        del self.__judge_queue[ent_id]