import os
from urllib.parse import urljoin

import requests
from lxml import etree
# Crawl the ZOL desktop-wallpaper listing pages and save every image that
# the listing XPath matches into SAVE_DIR as 0.jpg, 1.jpg, 2.jpg, ...
BASE_URL = 'http://desk.zol.com.cn/meinv/'
PAGE_SUFFIX = '.html'
FIRST_PAGE = 1
LAST_PAGE = 99  # the original loop was range(1, 100), i.e. pages 1..99
IMAGE_XPATH = '/html/body/div/div/ul/li/a/img/@src'
SAVE_DIR = 'D:/picture/'
REQUEST_TIMEOUT = 10  # seconds; without a timeout requests.get can block forever


def build_page_urls(first=FIRST_PAGE, last=LAST_PAGE):
    """Return the listing-page URLs for pages ``first``..``last`` inclusive."""
    return [BASE_URL + str(page) + PAGE_SUFFIX for page in range(first, last + 1)]


def image_path(index):
    """Return the file path under SAVE_DIR for the image numbered ``index``."""
    return SAVE_DIR + str(index) + '.jpg'


def extract_image_urls(page_url):
    """Fetch one listing page and return the absolute URLs of its images.

    Raises:
        requests.RequestException: on connection errors, timeouts, or a
            non-2xx HTTP status.
    """
    response = requests.get(page_url, timeout=REQUEST_TIMEOUT)
    response.raise_for_status()
    # The page source declares gb2312 as its encoding, so decode with it.
    response.encoding = 'gb2312'
    tree = etree.HTML(response.text)
    if tree is None:
        # Defensive: nothing to query if the parser produced no root element.
        return []
    # urljoin leaves absolute URLs untouched and resolves relative or
    # protocol-relative ("//host/img.jpg") ones against the page URL.
    return [urljoin(page_url, src) for src in tree.xpath(IMAGE_XPATH)]


def download_image(image_url, target_path):
    """Download ``image_url`` and write its bytes to ``target_path``.

    The file is opened only after the download succeeded, so a failed
    request never leaves an empty or partial file behind.

    Raises:
        requests.RequestException: on connection errors, timeouts, or a
            non-2xx HTTP status.
    """
    response = requests.get(image_url, timeout=REQUEST_TIMEOUT)
    response.raise_for_status()
    with open(target_path, 'wb') as fp:
        fp.write(response.content)


def main():
    """Crawl every listing page and save the images with sequential names."""
    os.makedirs(SAVE_DIR, exist_ok=True)
    # Dedicated counter for file names. The original reused the page-loop
    # variable ``i``, so numbering accidentally began at 99 instead of 0.
    saved = 0
    for page_url in build_page_urls():
        print("正在爬取" + page_url)
        try:
            image_urls = extract_image_urls(page_url)
        except requests.RequestException as exc:
            # One unreachable page should not abort the remaining pages.
            print("页面请求失败,已跳过: " + page_url + " (" + str(exc) + ")")
            continue
        for image_url in image_urls:
            try:
                download_image(image_url, image_path(saved))
            except requests.RequestException as exc:
                print("图片下载失败,已跳过: " + image_url + " (" + str(exc) + ")")
                continue
            # Advance only after a successful save so file names stay contiguous.
            saved += 1


if __name__ == "__main__":
    main()
# Result: