def expriment(self, path='', pagenum=100):
    """Write one statistics row per file found in each sub-directory of *path*.

    Every entry of *path* that is a directory is scanned; for each item
    inside it ``self.info(fi=..., pagenum=pagenum)`` is called and must
    return a pair ``(keywords, num)``.  A tab-separated row is then written
    to ``res.txt`` under ``config.hidepath`` with these columns:

    1. the item's path,
    2. ``len(keywords)``,
    3. the sum of the non-zero entries of ``num``,
    4. ``len(num)``,
    5. the number of entries of ``num`` equal to zero,

    followed by a ``||`` marker and every entry of ``num``.  After a
    sub-directory has been processed a ``"<dirname> End !"`` line is written.

    Args:
        path: Directory whose sub-directories are scanned.
        pagenum: Forwarded unchanged to ``self.info``.
    """
    # NOTE(review): block nesting was reconstructed; it assumes every entry
    # of ``num`` (zeros included) is listed after ``||`` and that the
    # ' End !' line is written once per sub-directory -- confirm.
    report_path = os.path.join(config.hidepath, 'res.txt')

    for dirname in os.listdir(path):
        subdir = os.path.join(path, dirname)
        if not os.path.isdir(subdir):
            continue

        for entry in os.listdir(subdir):
            target = os.path.join(subdir, entry)
            keywords, num = self.info(fi=target, pagenum=pagenum)

            zero_total = 0
            nonzero_sum = 0
            # Leading element is the '||' marker that separates the summary
            # columns from the per-entry values.
            detail = ['\t||']
            for count in num:
                if count == 0:
                    zero_total += 1
                else:
                    nonzero_sum = nonzero_sum + count
                detail.append(str(count))

            summary = [
                target,
                str(len(keywords)),
                str(nonzero_sum),
                str(len(num)),
                str(zero_total),
            ]
            row = '\t'.join(summary) + '\t'.join(detail) + '\n'
            # presumably appends to the file (name suggests so) -- verify
            # against FileUtil.
            FileUtil.write_apd_file(row, report_path)

        FileUtil.write_apd_file(dirname + ' End !\n', report_path)
def save_failed_page_url(self, new_url):
    """Record *new_url* as one line in ``self.filename`` if that file exists.

    Nothing is written when ``self.filename`` does not exist on disk.

    Args:
        new_url: URL string to record; a newline is added after it.
    """
    if not os.path.exists(self.filename):
        # NOTE(review): the URL is silently dropped when the file is
        # missing -- confirm this is intended.
        return

    line = new_url + '\n'
    FileUtil.write_apd_file(line, self.filename)
def save_failed_content(self, new_url, new_title):
    """Record a ``url<TAB>title`` line in ``self.file_name``.

    Args:
        new_url: URL string placed in the first column.
        new_title: Title string placed in the second column.
    """
    # NOTE(review): this reads ``self.file_name`` whereas
    # save_failed_page_url reads ``self.filename`` -- confirm both
    # attributes exist on the owning class.
    record = '\t'.join((new_url, new_title)) + '\n'
    FileUtil.write_apd_file(record, self.file_name)