下载http://pic.yxdown.com/list/0_0_4.html网站图片并保存:
用到的库:requests、BeautifulSoup(bs4),HTML 解析器使用 lxml
import requests
import re
from bs4 import BeautifulSoup
# Base URL of the picture list pages.
baseurl = 'http://pic.yxdown.com/list/'

# Seconds to wait on a single HTTP request before giving up, so one
# stalled connection cannot hang the whole crawl.
REQUEST_TIMEOUT = 10

# URLs of the first 20 list pages: 0_0_0.html ... 0_0_19.html.
urls = [baseurl + '0_0_' + str(i) + '.html' for i in range(20)]

# Image names (from the <img alt="..."> attribute) and image links (from
# <img src="...">). The two lists are kept index-aligned: names[i] belongs
# to links[i].
names = []
links = []


def safe_filename(name, fallback):
    """Return *name* cleaned up for use as a file name stem.

    Characters that are not allowed in file names on common platforms
    (path separators, ``: * ? " < > |`` and control whitespace) are
    replaced by ``_``; surrounding spaces and dots are stripped.

    Args:
        name: The raw name, typically the ``alt`` text of an image.
            May be ``None`` or empty.
        fallback: Stem to use when nothing usable is left of *name*.

    Returns:
        A non-empty string without an extension (provided *fallback*
        is non-empty).
    """
    cleaned = re.sub(r'[\\/:*?"<>|\r\n\t]', '_', name or '').strip(' .')
    return cleaned or fallback


def collect_images(page_urls):
    """Fetch every list page and return the images found on them.

    Each page is parsed for ``<a class="proimg">`` elements; the nested
    ``<img>`` supplies the link (``src``) and the name (``alt``).
    Pages that cannot be fetched are reported and skipped so that one
    bad page does not abort the whole run.

    Args:
        page_urls: Iterable of list-page URLs.

    Returns:
        A list of ``(link, name)`` tuples; ``name`` may be ``None``
        when the image has no ``alt`` attribute.
    """
    found = []
    for page_url in page_urls:
        try:
            response = requests.get(page_url, timeout=REQUEST_TIMEOUT)
            response.raise_for_status()
        except requests.RequestException as exc:
            print('skip page ' + page_url + ': ' + str(exc))
            continue
        soup = BeautifulSoup(response.text.lstrip(), 'lxml')
        for anchor in soup.find_all('a', class_='proimg'):
            img = anchor.find('img')
            # An anchor without an <img>, or an <img> without src, has
            # nothing to download.
            if img is None or not img.get('src'):
                continue
            found.append((img.get('src'), img.get('alt')))
    return found


def save_images(image_links, image_names):
    """Download each image and save it as ``<name>.jpg``.

    The link and its own name are paired with ``zip`` so every image is
    written to its own file (previously the last parsed name was reused
    for all images, so each download overwrote the previous one).

    Args:
        image_links: Image URLs.
        image_names: Names aligned index-by-index with *image_links*.
    """
    used = set()
    for index, (link, name) in enumerate(zip(image_links, image_names)):
        stem = safe_filename(name, 'image_' + str(index))
        # Different images may share the same alt text; disambiguate
        # with the running index instead of overwriting.
        if stem in used:
            stem = stem + '_' + str(index)
        used.add(stem)
        try:
            response = requests.get(link, timeout=REQUEST_TIMEOUT)
            response.raise_for_status()
        except requests.RequestException as exc:
            # Do not write an error page to disk as if it were a picture.
            print('skip image ' + link + ': ' + str(exc))
            continue
        with open(stem + '.jpg', 'wb') as f:
            f.write(response.content)


if __name__ == '__main__':
    for link, name in collect_images(urls):
        links.append(link)
        names.append(name)
    save_images(links, names)
爬取结果:
![在这里插入图片描述](https://img-blog.csdnimg.cn/201902191606533.png)