def save_prolst(self, page_number):
    """Scrape one HOJ problem-list page and store every problem it lists.

    Downloads ``volume?page=<page_number>`` from acm.hit.edu.cn, looks at
    table rows 1-9 under the ``content`` element and, for each row that
    carries a problem ID, saves a ``problemslist`` record (OJ="HOJ") and
    then calls ``self.save_problem`` with the site ID and the record's id.

    Rows without an ID cell are skipped, so no blank record is stored and
    ``save_problem`` is never called with an empty ID.

    Args:
        page_number: Page index; formatted into the URL with ``%d``.
    """
    # Python 2 only: switch the process-wide default encoding to UTF-8.
    reload(sys)
    sys.setdefaultencoding("utf-8")

    url = "http://acm.hit.edu.cn/hoj/problem/volume?page=%d" % page_number
    html = requests.get(url)
    pro_lst_page = etree.HTML(html.text)

    row_xpath = '//*[@id="content"]/table//tr[%d]'
    for i in range(1, 10):
        row = row_xpath % i

        ID = pro_lst_page.xpath(row + '/td[2]/text()')
        if not ID:
            # Row is absent or has no ID text; there is nothing to store.
            continue

        title = pro_lst_page.xpath(row + '/td[3]/a/ins/text()')
        ratio = pro_lst_page.xpath(row + '/td[5]')

        prolst_item = problemslist(
            OJ="HOJ",
            SID=ID[0],
            title=title[0] if title else "",
            # string(.) flattens the cell, including nested markup, to text.
            ratio=ratio[0].xpath('string(.)') if ratio else "",
            source="")
        prolst_item.save()

        # NOTE(review): problemID is set after save() and nothing visible
        # here saves the record again -- confirm whether it must persist.
        prolst_item.problemID = prolst_item.id
        self.save_problem(str(prolst_item.SID), prolst_item.id)
def save_prolst(self, page_number):
    """Scrape one POJ problem-list volume and store every problem it lists.

    Downloads ``problemlist?volume=<page_number>`` from poj.org, looks at
    rows 2-79 of the second table in the page body and, for each row that
    carries a problem ID, saves a ``problemslist`` record (OJ="POJ") and
    then calls ``self.save_problem`` with the site ID and the record's id.

    Rows without an ID cell are skipped, so no blank record is stored and
    ``save_problem`` is never called with an empty ID.

    Args:
        page_number: Volume index; formatted into the URL with ``%d``.
    """
    # Python 2 only: switch the process-wide default encoding to UTF-8.
    reload(sys)
    sys.setdefaultencoding("utf-8")

    url = "http://poj.org/problemlist?volume=%d" % page_number
    html = requests.get(url)
    pro_lst_page = etree.HTML(html.text)

    row_xpath = '/html/body/table[2]//tr[%d]'
    for i in range(2, 80):
        row = row_xpath % i

        ID = pro_lst_page.xpath(row + '/td[1]/text()')
        if not ID:
            # Row is absent or has no ID text; there is nothing to store.
            continue

        title = pro_lst_page.xpath(row + '/td[2]/a/text()')
        ratio = pro_lst_page.xpath(row + '/td[3]')

        prolst_item = problemslist(
            OJ="POJ",
            SID=ID[0],
            title=title[0] if title else "",
            # string(.) flattens the cell, including nested markup, to text.
            ratio=ratio[0].xpath('string(.)') if ratio else "",
            source="")
        prolst_item.save()

        # NOTE(review): problemID is set after save() and nothing visible
        # here saves the record again -- confirm whether it must persist.
        prolst_item.problemID = prolst_item.id
        self.save_problem(str(prolst_item.SID), prolst_item.id)
def save_prolst(self, page_number):
    """Fetch a page of the HOJ problem list and record its problems.

    Requests ``volume?page=<page_number>`` on acm.hit.edu.cn and walks
    table rows 1-9 beneath the ``content`` element. Every row that has a
    problem ID is stored as a ``problemslist`` record (OJ="HOJ") and then
    handed to ``self.save_problem`` as (site ID string, record id).

    A row with no ID cell is skipped: it produces neither a blank record
    nor a ``save_problem`` call with an empty ID.

    Args:
        page_number: Page index; formatted into the URL with ``%d``.
    """
    # Python 2 only: switch the process-wide default encoding to UTF-8.
    reload(sys)
    sys.setdefaultencoding("utf-8")

    url = "http://acm.hit.edu.cn/hoj/problem/volume?page=%d" % page_number
    html = requests.get(url)
    pro_lst_page = etree.HTML(html.text)

    row_xpath = '//*[@id="content"]/table//tr[%d]'
    for i in range(1, 10):
        row = row_xpath % i

        ID = pro_lst_page.xpath(row + '/td[2]/text()')
        if not ID:
            # Row is absent or has no ID text; there is nothing to store.
            continue

        title = pro_lst_page.xpath(row + '/td[3]/a/ins/text()')
        ratio = pro_lst_page.xpath(row + '/td[5]')

        prolst_item = problemslist(
            OJ="HOJ",
            SID=ID[0],
            title=title[0] if title else "",
            # string(.) flattens the cell, including nested markup, to text.
            ratio=ratio[0].xpath('string(.)') if ratio else "",
            source="")
        prolst_item.save()

        # NOTE(review): problemID is set after save() and nothing visible
        # here saves the record again -- confirm whether it must persist.
        prolst_item.problemID = prolst_item.id
        self.save_problem(str(prolst_item.SID), prolst_item.id)
def save_prolst(self, page_number):
    """Fetch a volume of the POJ problem list and record its problems.

    Requests ``problemlist?volume=<page_number>`` on poj.org and walks rows
    2-79 of the second table in the page body. Every row that has a
    problem ID is stored as a ``problemslist`` record (OJ="POJ") and then
    handed to ``self.save_problem`` as (site ID string, record id).

    A row with no ID cell is skipped: it produces neither a blank record
    nor a ``save_problem`` call with an empty ID.

    Args:
        page_number: Volume index; formatted into the URL with ``%d``.
    """
    # Python 2 only: switch the process-wide default encoding to UTF-8.
    reload(sys)
    sys.setdefaultencoding("utf-8")

    url = "http://poj.org/problemlist?volume=%d" % page_number
    html = requests.get(url)
    pro_lst_page = etree.HTML(html.text)

    row_xpath = '/html/body/table[2]//tr[%d]'
    for i in range(2, 80):
        row = row_xpath % i

        ID = pro_lst_page.xpath(row + '/td[1]/text()')
        if not ID:
            # Row is absent or has no ID text; there is nothing to store.
            continue

        title = pro_lst_page.xpath(row + '/td[2]/a/text()')
        ratio = pro_lst_page.xpath(row + '/td[3]')

        prolst_item = problemslist(
            OJ="POJ",
            SID=ID[0],
            title=title[0] if title else "",
            # string(.) flattens the cell, including nested markup, to text.
            ratio=ratio[0].xpath('string(.)') if ratio else "",
            source="")
        prolst_item.save()

        # NOTE(review): problemID is set after save() and nothing visible
        # here saves the record again -- confirm whether it must persist.
        prolst_item.problemID = prolst_item.id
        self.save_problem(str(prolst_item.SID), prolst_item.id)