def get_one_topic_from2(url, desc, dir_path):
    """Fetch one page of topic results and write each post as a CSV row.

    The response body of ``Req.post(url)`` is parsed as JSON. Every entry of
    ``data.cards`` that carries an ``mblog`` object is turned into one row
    and handed to ``write_csv_rows`` together with ``csv_headers``.

    Args:
        url: Page URL, requested through ``Req.post``.
        desc: Forwarded unchanged to ``write_csv_rows``.
        dir_path: Forwarded unchanged to ``write_csv_rows``.

    Returns:
        None. Returns early, writing nothing, when the payload reports
        ``ok == 0``. A payload without ``data``/``cards`` is treated as an
        empty page.
    """
    response = Req.post(url)
    data = response.text
    print(url)

    # Parse the body once and reuse it for both the status check and the cards.
    payload = json.loads(data)
    if payload.get('ok') == 0:
        return

    cards = (payload.get('data') or {}).get('cards') or []
    for card in cards:
        mblog = card.get('mblog')
        if mblog is None:
            # Cards without a post body cannot produce a row; skip them
            # instead of failing on ``None.get``.
            continue

        # Named ``created_time`` so the local does not shadow the ``time`` module.
        created_time = time_handler(mblog.get('created_at'))
        user_name = mblog.get('user').get('screen_name')
        # The post text is HTML; keep only its plain-text content.
        text = BeautifulSoup(mblog.get('text')).get_text()

        print(f"{user_name} {created_time} {text}")
        csv_c = {
            '用户名': user_name,
            '文本内容': text,
            '发布时间': created_time,
            '点赞数': mblog.get('attitudes_count'),
            '评论数': mblog.get('comments_count'),
            '转发数': mblog.get('reposts_count'),
        }
        write_csv_rows(csv_headers, csv_c, desc, dir_path)
def get_one_topic_first_page(url, desc, dir_path):
    """Fetch the first page of a topic search and write each post as a CSV row.

    On this page the posts are nested: each entry of ``data.cards`` may hold
    a ``card_group`` list, and the post is read from the ``mblog`` field of
    that list's first element. Every post found is turned into one row and
    handed to ``write_csv_rows`` together with ``csv_headers``.

    Args:
        url: Page URL, requested through ``Req.post``.
        desc: Topic description; printed in the progress message and
            forwarded unchanged to ``write_csv_rows``.
        dir_path: Forwarded unchanged to ``write_csv_rows``.

    Returns:
        None. Returns early, writing nothing, when the payload reports
        ``ok == 0``. A payload without ``data``/``cards`` is treated as an
        empty page.
    """
    print(f"搜索话题[{desc}]的第1页")
    response = Req.post(url)
    data = response.text

    payload = json.loads(data)
    cards = (payload.get('data') or {}).get('cards') or []
    print(url)
    if payload.get('ok') == 0:
        return

    for card in cards:
        card_group = card.get('card_group')
        if not card_group:
            # Covers both a missing group and an empty list, so indexing
            # the first element below cannot raise IndexError.
            continue
        mblog = card_group[0].get('mblog')
        if mblog is None:
            continue

        # Named ``created_time`` so the local does not shadow the ``time`` module.
        created_time = time_handler(mblog.get('created_at'))
        user_name = mblog.get('user').get('screen_name')
        # The post text is HTML; keep only its plain-text content.
        text = BeautifulSoup(mblog.get('text')).get_text()

        print(f"{user_name} {created_time} {text}")
        csv_c = {
            '用户名': user_name,
            '文本内容': text,
            '发布时间': created_time,
            '点赞数': mblog.get('attitudes_count'),
            '评论数': mblog.get('comments_count'),
            '转发数': mblog.get('reposts_count'),
        }
        write_csv_rows(csv_headers, csv_c, desc, dir_path)