import re
from pathlib import Path

import requests
from lxml import etree
# HTTP headers sent with every request (a desktop Chrome User-Agent string).
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/100.0.4896.60 Safari/537.36'
}

BASE_URL = 'https://pic.netbian.com'
# To scrape another kind of picture, change the part after "4k" to the
# pinyin of the desired category.
CATEGORY = '4kmeinv'
# Listing pages to crawl: FIRST_PAGE inclusive, LAST_PAGE exclusive.
FIRST_PAGE = 30
LAST_PAGE = 100
# Directory the downloaded images are written to.
SAVE_DIR = 'C:\\软件\\新建文件夹\\'
# Seconds to wait on any single HTTP request before giving up.
REQUEST_TIMEOUT = 10
# The original script re-decoded the caption bytes as GBK; decoding the whole
# page as GBK up front gives the same captions without relying on requests
# having guessed ISO-8859-1 first.
PAGE_ENCODING = 'gbk'

# Characters that are not allowed in Windows file names, plus control chars.
_INVALID_FILENAME_CHARS = re.compile(r'[\\/:*?"<>|\x00-\x1f]')


def build_page_url(page):
    """Return the listing-page URL for page number *page* of CATEGORY."""
    return BASE_URL + '/' + CATEGORY + '/index_' + str(page) + '.html'


def sanitize_filename(name):
    """Return *name* made safe to use as a file name.

    Characters illegal in Windows file names are replaced with ``_`` and
    surrounding whitespace / trailing dots are removed. An empty result
    falls back to ``'untitled'`` so a file can always be created.
    """
    cleaned = _INVALID_FILENAME_CHARS.sub('_', name).strip().rstrip('. ')
    return cleaned or 'untitled'


def download_page(session, page, save_dir):
    """Download every image listed on one listing page into *save_dir*.

    Args:
        session: a ``requests.Session`` carrying the request headers.
        page: listing page number.
        save_dir: ``pathlib.Path`` of an existing directory.

    Raises:
        requests.RequestException: if the listing page itself cannot be
            fetched. Failures on individual images are reported and skipped.
    """
    # Fetch the listing page.
    response = session.get(build_page_url(page), timeout=REQUEST_TIMEOUT)
    response.raise_for_status()
    response.encoding = PAGE_ENCODING
    tree = etree.HTML(response.text)
    if tree is None:
        # lxml returns None when there is nothing to parse.
        return

    for item in tree.xpath('//ul[@class="clearfix"]/li'):
        sources = item.xpath('./a/img/@src')
        captions = item.xpath('./a/b/text()')
        if not sources or not captions:
            # Not an image entry (no thumbnail or no caption); skip it.
            continue
        img_src = BASE_URL + sources[0]
        img_name = captions[0]
        try:
            img_response = session.get(img_src, timeout=REQUEST_TIMEOUT)
            img_response.raise_for_status()
        except requests.RequestException as exc:
            print(img_name, 'download failed:', exc)
            continue
        target = save_dir / (sanitize_filename(img_name) + '.jpg')
        # The context manager closes the file even if the write fails.
        with open(target, 'wb') as fp:
            fp.write(img_response.content)
        print(img_name, '下载完成')


def main():
    """Crawl listing pages FIRST_PAGE..LAST_PAGE-1 and save their images."""
    save_dir = Path(SAVE_DIR)
    save_dir.mkdir(parents=True, exist_ok=True)
    # One session reuses the underlying connection across all requests.
    with requests.Session() as session:
        session.headers.update(headers)
        # Scrape multiple pages.
        for page in range(FIRST_PAGE, LAST_PAGE):
            try:
                download_page(session, page, save_dir)
            except requests.RequestException as exc:
                print('page', page, 'failed:', exc)


if __name__ == '__main__':
    main()
# 网络4K图片批量下载
# 最新推荐文章于 2024-10-18 00:00:00 发布