可视化学习笔记 pyecharts
pyecharts 是一款强大的可视化工具,API 文档为中文,比较容易学习。本次主要用到的 API 为 Map().add('名称', data, maptype),其中 maptype 取 'china' 或 'world'。
爬取丁香园数据
import json
import re
import requests
import datetime
# DXY (丁香园) nCoV page; the functions below pull JSON out of inline
# ``window.<name> = ...`` assignments found in its HTML.
url = 'https://ncov.dxy.cn/ncovh5/view/pneumonia'
# Date stamp (YYYYMMDD) used as the prefix of the output file names.
today = datetime.date.today().strftime('%Y%m%d')
# A timeout keeps the script from hanging forever on an unresponsive server,
# and raise_for_status() reports HTTP errors here instead of letting them
# show up later as a confusing "pattern not found" failure.
response = requests.get(url, timeout=30)
response.raise_for_status()
# Decode the raw bytes explicitly as UTF-8 (the default of bytes.decode()).
html = response.content.decode('utf-8')
def get_internal():
    """Extract the ``window.getAreaStat`` JSON from the page and save it.

    Reads the module-level ``html`` string, pulls out the JSON array assigned
    to ``window.getAreaStat`` and writes it to ``<today>internal.json``
    (relative to the current working directory), keeping non-ASCII text
    unescaped.

    Raises:
        ValueError: If the ``window.getAreaStat`` assignment cannot be found
            in ``html``. ``json.JSONDecodeError`` (a ``ValueError`` subclass)
            is raised if the extracted text is not valid JSON.
    """
    # The data appears as ``window.getAreaStat = [...]}catch``. Capture only
    # the array itself: a lazy match up to the first ``}]`` that is directly
    # followed by ``}catch``. Dots and braces are escaped so they match
    # literally.
    match = re.search(r'window\.getAreaStat = (.*?\}\])\}catch', html, re.S)
    if match is None:
        raise ValueError('window.getAreaStat data not found in page HTML')
    json_data = json.loads(match.group(1))
    with open(today + 'internal.json', 'w', encoding='UTF-8') as f:
        json.dump(json_data, f, ensure_ascii=False)
def get_external():
    """Extract the ``window.getListByCountryTypeService2true`` JSON and save it.

    Reads the module-level ``html`` string, pulls out the JSON array assigned
    to ``window.getListByCountryTypeService2true`` and writes it to
    ``<today>external.json`` (relative to the current working directory),
    keeping non-ASCII text unescaped.

    Raises:
        ValueError: If the ``window.getListByCountryTypeService2true``
            assignment cannot be found in ``html``. ``json.JSONDecodeError``
            (a ``ValueError`` subclass) is raised if the extracted text is
            not valid JSON.
    """
    # The data appears as ``window.getListByCountryTypeService2true = [...]}catch``.
    # Capture only the array itself: a lazy match up to the first ``}]`` that
    # is directly followed by ``}catch``. Dots and braces are escaped so they
    # match literally.
    match = re.search(
        r'window\.getListByCountryTypeService2true = (.*?\}\])\}catch',
        html,
        re.S,
    )
    if match is None:
        raise ValueError(
            'window.getListByCountryTypeService2true data not found in page HTML'
        )
    json_data = json.loads(match.group(1))
    with open(today + 'external.json', 'w', encoding='UTF-8') as f:
        json.dump(json_data, f, ensure_ascii=False)
if __name__ == '__main__':
    # When run as a script, dump the domestic data first, then the overseas data.
    for dump in (get_internal, get_external):
        dump()
爬取结果
国内结果示例
国外结果示例