import urllib.request
import urllib.parse
# Request headers carrying a desktop-browser User-Agent string
# (Chrome 97 / Edge 97 on 64-bit Windows 10).
header = {
    'User-Agent': (
        'Mozilla/5.0 (Windows NT 10.0; Win64; x64) '
        'AppleWebKit/537.36 (KHTML, like Gecko) '
        'Chrome/97.0.4692.71 Safari/537.36 Edg/97.0.1072.62'
    ),
}

# Endpoint the script posts its queries to. The name is spelled "ulr"
# because getrequest() looks it up under that name.
ulr = 'http://www.kfc.com.cn/kfccda/ashx/GetStoreList.ashx?op=cname'
def getrequest(page, *, cname='重庆', url=None):
    """Build the POST request for one page of the store-list query.

    Args:
        page: Page number, sent as the ``pageIndex`` form field.
        cname: City name, sent as the ``cname`` form field. Defaults to
            the city this script originally hard-coded.
        url: Endpoint to post to. When omitted, the module-level ``ulr``
            constant is used.

    Returns:
        A ``urllib.request.Request`` holding the URL-encoded form body and
        a browser-like ``User-Agent`` header. The request is only built
        here, not sent.
    """
    headers = {
        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/97.0.4692.71 Safari/537.36 Edg/97.0.1072.62',
    }
    form = {
        'cname': cname,
        'pid': '',
        'pageIndex': page,
        'pageSize': '10',
    }
    # urlencode() turns the dict into a URL-encoded form string.
    # encode('utf-8') is required: the body of a POST request must be
    # bytes, and supplying ``data`` is what makes urllib issue a POST.
    body = urllib.parse.urlencode(form).encode('utf-8')
    # Fall back to the module-level endpoint only when none was given.
    target = ulr if url is None else url
    return urllib.request.Request(url=target, data=body, headers=headers)
if __name__ == '__main__':
    # Prompt for an inclusive page range; int() raises ValueError if the
    # user types something that is not an integer.
    start_page = int(input('起始页'))
    stop_page = int(input('结束页'))
    for page in range(start_page, stop_page + 1):
        requ = getrequest(page)
        # Use the response as a context manager so the connection is
        # closed even if reading or decoding fails.
        with urllib.request.urlopen(requ) as response:
            content = response.read().decode('utf-8')
        # Save each page's response body to its own JSON file.
        with open('肯德基_第' + str(page) + '.json', 'w', encoding='utf-8') as fp:
            fp.write(content)
# Crawler practice: POST request (scraping KFC store information).
# Blog page footer: "latest recommended article published 2022-07-23 20:24:03".