入门小菜鸟的学习笔记,希望大佬们帮忙纠错啦~侵权立删。
一、加载库
import re
import time
import json
import requests
import pandas as pd
import numpy as np
from pyecharts.charts import Map
from pyecharts import options as opts
二、发送请求,获取文本数据
# Page to download; the response body is parsed by the statements that follow.
url = 'https://voice.baidu.com/act/newpneumonia/newpneumonia/?from=osari_aladin_banner'
headers = {
    'user-agent': 'XXXXX',  # placeholder: replace with your own browser User-Agent string
}
# requests applies no timeout by default, so bound the wait instead of
# letting a stalled connection hang the script forever.
response = requests.get(url=url, headers=headers, timeout=10)
# Fail right here on a 4xx/5xx answer rather than feeding an error page
# into the parsing step.
response.raise_for_status()
data = response.text
三、解析数据
# Capture the text between '"component":[' and the last '],' that follows it
# on the same line (the group is greedy and '.' does not match newlines).
# The pattern is a raw string so that '\[' and '\]' reach the regex engine
# as written instead of being invalid Python string escapes.
component_match = re.search(r'"component":\[(.*)\],', data)
if component_match is None:
    # Name the actual problem instead of surfacing "list index out of range".
    raise ValueError('"component" payload not found in the response text')
data = component_match.group(1)
# Decode the captured JSON text into Python objects.
json_data = json.loads(data)
四、获取并保存数据
# Empty DataFrame; presumably filled by the loop that follows — confirm.
Data = pd.DataFrame()
# Value stored under the 'caseList' key of the parsed payload; iterated next.
final_data = json_data['caseList']
for i in final_data: