本文共 1026 字,大约阅读时间需要 3 分钟。
需要调整的参数是新冠肺炎和page,返回一页的数据
import requestsimport pandas as pdimport jsonimport redef get_one_page(): one_page_data = [] params = { 'containerid': '100103type=60&q=新冠肺炎&t=0', 'page_type': 'searchall', 'page': 1 } url = 'https://m.weibo.cn/api/container/getIndex'# 请求api response = requests.get(url,params=params).text cards = json.loads(response)['data']['cards'] for card in cards: blog_data = card['mblog'] text = re.sub('<.*?>','',blog_data['text']) # 文章内容 mid = blog_data['mid'] # 文章id reposts_count = blog_data['reposts_count'] # 转发数 comments_count = blog_data['comments_count'] # 评论数 attitudes_count = blog_data['attitudes_count'] # 点赞数 data = [text,mid,reposts_count,comments_count,attitudes_count] column = ['text','mid','reposts_count','comments_count','attitudes_count'] one_page_data.append(dict(zip(column,data))) return one_page_dataif __name__ == '__main__': data = get_one_page() print(data)
转载地址:http://cwrf.baihongyu.com/