import requests
import time
from lxml import etree
import json
# headers = {
# 'User-Agent':'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/64.0.3282.204 Safari/537.36',
# 'Cookie':'AD_RS_COOKIE=20080918; _trs_uv=kahvgie3_6_fc6v'
# }
# main_address = "http://www.stats.gov.cn/tjsj/tjbz/tjyqhdmhcxhfdm/2020/"
def analysis_html(address, pattern, timeout=30):
    """Download a page and collect the nodes matching an XPath expression.

    The matched nodes are stored in the module-level global ``trs`` (which
    other functions in this file read) and are also returned for callers
    that prefer not to rely on the global.

    Args:
        address: URL of the page to fetch.
        pattern: XPath expression evaluated against the parsed document.
        timeout: Seconds to wait for the server before ``requests`` raises
            a timeout error, so that a stalled connection cannot hang the
            scraper forever.

    Returns:
        The list produced by evaluating ``pattern`` on the parsed page, or
        an empty list when the response could not be parsed into a tree.

    Note:
        Reads the module-level ``headers`` mapping, which must be defined
        before this function is called.
    """
    global trs
    response = requests.get(address, headers=headers, timeout=timeout)
    # Force GBK decoding instead of the encoding guessed by requests.
    response.encoding = 'gbk'
    html = etree.HTML(response.text)
    # Guard against a missing root element (no parseable markup) so that
    # callers see an empty result rather than an AttributeError.
    trs = html.xpath(pattern) if html is not None else []
    return trs
def make_url(url_before, pattern):
    """Build a URL by appending the first XPath match to a prefix.

    The XPath ``pattern`` is evaluated on the module-level global ``tr``
    (the node currently being processed by the caller's loop); the first
    result is concatenated onto ``url_before``.

    Args:
        url_before: URL prefix placed in front of the matched value.
        pattern: XPath expression evaluated against the global ``tr``.

    Returns:
        ``url_before`` followed by the first match of ``pattern``.

    Raises:
        IndexError: If ``pattern`` matches nothing on ``tr``.
    """
    matches = tr.xpath(pattern)
    first_match = matches[0]
    return url_before + first_match
def province():
global tr
analysis_html(f'{main_address}index.html', '//tr[@class="provincetr"]/td')
for tr in trs[:-1]:
province = tr.xpath('./a/text()
Python 获取行政区域代码
最新推荐文章于 2022-03-23 12:16:13 发布
本文详细介绍了如何使用 Python 进行行政区域代码的获取，包括从网络 API 获取数据、解析 JSON，以及存储到本地数据库的方法，为后端开发中的地理位置处理提供便利。
摘要由CSDN通过智能技术生成