思路:
1、获取JS源代码
2、获取英雄ID
3、拼接完整路径
4、下载的位置
5、下载
import requests
import re
import json
#获取JS源代码
def download_image():
js_url = 'https://lol.qq.com/biz/hero/champion.js'
js_html = requests.get(js_url).text
#状态码 200:请求成功 404:页面未找到
# print(js_html)
# 正则表达式
req = r'"keys":(.*?),"data"'
hero_list = re.findall(req,js_html)
#字符串
hero_list = hero_list[0]
#str-->json
dict_hero = json.loads(hero_list)
#获取英雄ID
list_hero_url = []
for hero_id in dict_hero:
#print(hero_id)
for i in range(20):
i = str(i)
if len(i) == 1:
hero_num = "00" + i
elif len(i) == 2:
hero_num = "0" + i
url = 'https://ossweb-img.qq.com/images/lol' \
'/web201310/skin/big'+ hero_id + hero_num +'.jpg'
list_hero_url.append(url)
#print(list_hero_url)
#拼接
file_path = []
for hero_name in dict_hero.values():
print(hero_name)
path = r'C:\Users\Administrator\PycharmProjects\Test1\2018_11_16爬虫练习\LOLpic\\'
for i in range(20):
files = path + hero_name + str(i) + ".jpg"
file_path.append(files)
#下载
num = 0
for i in list_hero_url:
# print(i)
if requests.get(i).status_code == 200:
content = requests.get(i).content
#print(content) 二进制文件
# print("正在下载%s"%file_path[num])
f = open(file_path[num],'wb')
f.write(content)
f.close()
num += 1
def main():
download_image()
if __name__ == '__main__':
main()
完成效果如下图: