import requests
from lxml import etree
from openpyxl import Workbook
import json
# Scrape the Baidu epidemic page and export its per-region case list to an
# Excel workbook: one worksheet per region, one row per city.

# Step 1: fetch the data.
# The timeout keeps the script from hanging on a stalled connection, and
# raise_for_status() stops on an HTTP error instead of parsing an error page.
result = requests.get(
    'https://voice.baidu.com/act/newpneumonia/newpneumonia',
    timeout=10,
)
result.raise_for_status()

# Step 2: parse the data.
# The payload is read from the text of <script type="application/json">.
html = etree.HTML(result.text)
json_blobs = html.xpath('//script[@type="application/json"]/text()')
if not json_blobs:
    # Fail with a clear message rather than an IndexError on json_blobs[0].
    raise RuntimeError(
        'No <script type="application/json"> element found in the page'
    )
res = json.loads(json_blobs[0])

# Step 3: save.
wb = Workbook()
res = res['component'][0]['caseList']
for region in res:
    print(region)
    print('*'*50,'\n')
    sheet_title = region['area']
    ws = wb.create_sheet(sheet_title)
    # Header row: region, cumulative confirmed, cumulative deaths,
    # cumulative cured, currently confirmed, newly confirmed.
    ws.append(['地区','累计确诊','累计死亡','累计治愈','现有确诊','新增确诊'])
    # A distinct loop variable is used here so the region being processed is
    # not shadowed by its own sub-entries.
    for city in region['subList']:
        print(city)
        print('*' * 60, '\n')
        # NOTE(review): the key 'crued' is kept exactly as written in the
        # original script; presumably it matches the upstream payload's
        # spelling -- confirm before "correcting" it to 'cured'.
        ws.append([city['city'],city['confirmed'],city['died'],
                   city['crued'],city['curConfirm'],city['confirmedRelative']])

# Write the workbook once, after every region sheet has been filled.
wb.save('2022527国内疫情数据.xlsx')
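# NOTE: the two lines below appear to be leftover text from the web page this
# script was copied from; they are kept as comments so the file stays valid.
# guoneiyiqin
# 最新推荐文章于 2024-07-23 20:40:26 发布
# (English: "Latest recommended article published on 2024-07-23 20:40:26")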