def parse_author_id(self):
    u"""
    Extract the blog author's id and store it in ``self.info['author_id']``.

    The id is read from the ``href`` of the second anchor matched by the
    CSS selector ``div.blognavInfo span a`` (the first matched anchor is
    the home-page link). When the anchor, its ``href`` or the id inside
    the ``href`` cannot be found, a debug message is logged and
    ``self.info`` is left untouched.

    :return: None
    """
    anchors = self.dom.select('div.blognavInfo span a')

    author_id_href = False
    # anchors[0] is the home-page link, so the profile link is anchors[1].
    # Require at least two matches so unexpected markup does not raise
    # IndexError.
    if anchors and len(anchors) > 1:
        author_id_href = ParserTools.get_attr(anchors[1], 'href')

    if not author_id_href:
        Debug.logger.debug(u"没有找到creator_id")
        # TODO (carried over from the original): no fallback implemented yet
        return

    result = Match.sinablog_profile(author_id_href)
    if result is None:
        # NOTE(review): presumably a regex match object that is None when the
        # href is not a profile URL -- confirm against Match.sinablog_profile.
        Debug.logger.debug(u"没有找到creator_id")
        return

    self.info['author_id'] = result.group('sinablog_people_id')