def get_tweet_by_title(self, param_dict):
    """Download one page of title-search results and parse its posts.

    Args:
        param_dict: Mapping read for the keys ``'title'``, ``'page'``,
            ``'start'``, ``'end'`` and ``'root_selector'``. ``'start'`` and
            ``'end'`` are passed through ``Utils.parse_input_date`` before
            being handed to the downloader. ``'page'`` is formatted with
            ``%d`` in the log line, so it must be numeric.

    Returns:
        ``([], True)`` when the page number found in the downloaded HTML is
        lower than the requested page; otherwise the result of
        ``WeiboCssParser(...).get_weibos()``.
        NOTE(review): presumably ``get_weibos()`` returns a compatible
        ``(items, flag)`` pair -- confirm against the parser.
    """
    downloader = WeiboDonwloader(self.cookies)
    html = downloader.search_page(
        title=param_dict['title'],
        page=param_dict['page'],
        start=Utils.parse_input_date(param_dict['start']),
        end=Utils.parse_input_date(param_dict['end']),
    )
    requested_page = param_dict['page']

    current_page = WeiboUser.get_page(html)
    self.logger.info(
        'GET page %d, current page %s' % (requested_page, str(current_page))
    )

    # The returned HTML reports a page before the one requested: hand back an
    # empty result instead of parsing it.
    # NOTE(review): the True flag presumably means "no more pages" -- confirm.
    if current_page is not None and current_page < requested_page:
        return [], True

    parser = WeiboCssParser(
        html,
        self.cookies,
        param_dict['root_selector'],
        WeiboUser.search_map,
        WeiboUser.search_map_end,
    )
    return parser.get_weibos()
def get_tweet_by_userid(self, param_dict):
    """Download one page of a user's posts and parse them.

    Args:
        param_dict: Mapping read for the keys ``'uid'``, ``'page'`` and
            ``'root_selector'``.

    Returns:
        The result of ``WeiboCssParser(...).get_weibos()`` for the
        downloaded page, parsed with ``WeiboUser.person_map``.
    """
    downloader = WeiboDonwloader(self.cookies)
    page_html = downloader.person_page(
        uid=param_dict['uid'],
        page=param_dict['page'],
    )
    parser = WeiboCssParser(
        page_html,
        self.cookies,
        param_dict['root_selector'],
        WeiboUser.person_map,
    )
    return parser.get_weibos()
def get_comment(self, mid, page):
    """Download one page of comments for a post and parse them.

    Args:
        mid: Forwarded as ``mid`` to ``WeiboDonwloader.comment_page``.
        page: Forwarded as ``page`` to ``WeiboDonwloader.comment_page``.

    Returns:
        The result of ``WeiboCssParser(...).get_weibos()`` using the
        ``'.list_ul > div[comment_id]'`` root selector and
        ``WeiboUser.comment_map``.
    """
    downloader = WeiboDonwloader(self.cookies)
    # comment_page's result is unpacked into three values; only the HTML is
    # used here, the other two are deliberately ignored.
    comment_html, _pagenum, _maxid = downloader.comment_page(mid=mid, page=page)
    parser = WeiboCssParser(
        comment_html,
        self.cookies,
        '.list_ul > div[comment_id]',
        WeiboUser.comment_map,
    )
    return parser.get_weibos()