def getDateByUrl(self, url):
    """Return the date found after " ~ " in the first ``<p>`` of the page.

    The page is obtained through ``self.getSoup(url)``. The ``string`` of the
    last child of the first ``<p>`` element is UTF-8 encoded and matched
    against ``.* ~ (.*)``; the captured text is handed to
    ``date_parser.parseChineseStyle``.

    Args:
        url: Address of the page, passed unchanged to ``self.getSoup``.

    Returns:
        The result of ``date_parser.parseChineseStyle`` for the captured
        text, or ``None`` when ``getSoup`` returns ``None``, the page has no
        ``<p>`` element, that element has no children, its last child has no
        string, or the " ~ " separator is absent.
    """
    soup = self.getSoup(url)
    if soup is None:
        return None

    # Guard every step of the DOM walk so a page without the expected markup
    # yields None (like the sibling getters) instead of raising
    # AttributeError / IndexError.
    paragraph = soup.find("p")
    if paragraph is None or not paragraph.contents:
        return None
    text = paragraph.contents[-1].string
    if text is None:
        return None

    # The greedy ".*" makes the capture start after the last " ~ " on the
    # first line of the text.
    m = re.match(r".* ~ (.*)", text.encode("utf-8"))
    if m is None:
        return None
    return date_parser.parseChineseStyle(m.group(1))
def getEndDateByUrl(self, url):
    """Return the end date listed next to the "活动时间" label of a page.

    The page is obtained through ``self.getSoup(url)``. The method looks for
    a ``<strong>`` element whose text matches "活动时间", takes the second
    ``next_sibling`` of that element's parent, UTF-8 encodes its ``string``
    and matches it against ``.*至(.*日)``. The captured text is handed to
    ``date_parser.parseChineseStyle``.

    Args:
        url: Address of the page, passed unchanged to ``self.getSoup``.

    Returns:
        The result of ``date_parser.parseChineseStyle`` for the captured
        text, or ``None`` when ``getSoup`` returns ``None``, the pattern does
        not match, or any step of the extraction raises.
    """
    soup = self.getSoup(url)
    if soup is None:
        return None
    try:
        # NOTE(review): str.decode only exists on Python 2 byte strings; on
        # Python 3 this raises AttributeError, which the handler below turns
        # into None.
        label_pattern = re.compile("活动时间".decode("utf-8"))
        label = soup.find("strong", text=label_pattern)
        s = label.parent.next_sibling.next_sibling.string.encode("utf-8")
        m = re.match(".*至(.*日)", s)
        if m is None:
            return None
        return date_parser.parseChineseStyle(m.group(1))
    except Exception:
        # Best-effort lookup: unexpected markup or an unparsable date yields
        # None. Unlike a bare ``except:``, this lets KeyboardInterrupt and
        # SystemExit propagate.
        return None
def getEndTime(self, url):
    """Extract an end date from the full text of the page at *url*.

    The page is obtained through ``self.getSoup(url)``; its ``get_text()``
    output is UTF-8 encoded and matched against ``.*至(.*?日)`` with
    ``re.DOTALL``. The captured text is handed to
    ``date_parser.parseChineseStyle``.

    Returns:
        The result of ``date_parser.parseChineseStyle`` for the captured
        text, or ``None`` when ``getSoup`` returns a falsy value or the
        pattern does not match.
    """
    page = self.getSoup(url)
    if not page:
        return None

    encoded_text = page.get_text().encode("utf-8")
    # re.DOTALL lets the leading ".*" run across line breaks.
    found = re.match(r".*至(.*?日)", encoded_text, re.DOTALL)
    if not found:
        return None
    return date_parser.parseChineseStyle(found.group(1))