def test_city_parser(self):
    """Check city_parser.parseBracketStyle on bracketed titles and on None."""
    # (expected, title) pairs: city in a trailing bracket, city in a
    # leading bracket, and a None title which is expected to yield None.
    cases = (
        ("上海", "中信倍精彩活动[上海]"),
        ("上海", "[上海]中信倍精彩活动"),
        (None, None),
    )
    for expected, title in cases:
        self.assertEqual(expected, city_parser.parseBracketStyle(title))
def test_city_parser(self):
    """Check city_parser.parseBracketStyle on bracketed titles and on None."""
    # (expected, title) pairs: city in a trailing bracket, city in a
    # leading bracket, and a None title which is expected to yield None.
    cases = (
        ("上海", "中信倍精彩活动[上海]"),
        ("上海", "[上海]中信倍精彩活动"),
        (None, None),
    )
    for expected, title in cases:
        self.assertEqual(expected, city_parser.parseBracketStyle(title))
def fetchBankListByUrl(self, url):
    """Build Bank records from the ``<li class="link">`` entries of a page.

    The page is fetched with ``self.openUrl(url)`` and parsed with
    BeautifulSoup. For every list item that contains an anchor with an
    ``href``, a ``Bank`` is created with:

    * ``url``   - the href, prefixed with the site root when it is relative;
    * ``city``  - the result of ``city_parser.parseBracketStyle`` on the
      anchor text, reset to None for known non-city labels;
    * ``title`` - the anchor text with its first ``[...]`` tag removed.

    Returns:
        A list of Bank objects (possibly empty), or None when
        ``self.openUrl`` returns None.
    """
    site_root = "http://creditcard.cib.com.cn"
    # Bracketed labels that must not be stored as a city.
    non_city_labels = ("兴悦会", "机票随兴订")

    f = self.openUrl(url)
    if f is None:
        # Keep the original contract: no page means None, not an empty list.
        return None

    banks = []
    soup = BeautifulSoup(f)
    for item in soup.find_all("li", class_="link"):
        anchor = item.find("a")
        if anchor is None:
            # Entry without a link; skip it instead of aborting the scrape.
            continue
        href = anchor.get("href")
        if href is None:
            continue
        href = href.encode("utf-8")

        # .string is None when the anchor has more than one child node;
        # fall back to the concatenated text in that case.
        text = anchor.string
        if text is None:
            text = anchor.get_text()
        title = text.strip().encode("utf-8")

        b = Bank()
        # Absolute links (http or https) are kept; anything else is
        # treated as a path relative to the site root.
        if href.startswith(("http:", "https:")):
            b.url = href
        else:
            b.url = site_root + href

        b.city = city_parser.parseBracketStyle(title)
        if b.city in non_city_labels:
            b.city = None
        b.title = re.sub(r"\[.*?\](.*)", r"\1", title)
        banks.append(b)
    return banks
def fetchBankListByUrl(self, url):
    """Build Bank records from the ``<li class="link">`` entries of a page.

    The page is fetched with ``self.openUrl(url)`` and parsed with
    BeautifulSoup. For every list item that contains an anchor with an
    ``href``, a ``Bank`` is created with:

    * ``url``   - the href, prefixed with the site root when it is relative;
    * ``city``  - the result of ``city_parser.parseBracketStyle`` on the
      anchor text, reset to None for known non-city labels;
    * ``title`` - the anchor text with its first ``[...]`` tag removed.

    Returns:
        A list of Bank objects (possibly empty), or None when
        ``self.openUrl`` returns None.
    """
    site_root = "http://creditcard.cib.com.cn"
    # Bracketed labels that must not be stored as a city.
    non_city_labels = ("兴悦会", "机票随兴订")

    f = self.openUrl(url)
    if f is None:
        # Keep the original contract: no page means None, not an empty list.
        return None

    banks = []
    soup = BeautifulSoup(f)
    for item in soup.find_all("li", class_="link"):
        anchor = item.find("a")
        if anchor is None:
            # Entry without a link; skip it instead of aborting the scrape.
            continue
        href = anchor.get("href")
        if href is None:
            continue
        href = href.encode("utf-8")

        # .string is None when the anchor has more than one child node;
        # fall back to the concatenated text in that case.
        text = anchor.string
        if text is None:
            text = anchor.get_text()
        title = text.strip().encode("utf-8")

        b = Bank()
        # Absolute links (http or https) are kept; anything else is
        # treated as a path relative to the site root.
        if href.startswith(("http:", "https:")):
            b.url = href
        else:
            b.url = site_root + href

        b.city = city_parser.parseBracketStyle(title)
        if b.city in non_city_labels:
            b.city = None
        b.title = re.sub(r"\[.*?\](.*)", r"\1", title)
        banks.append(b)
    return banks