import os
import re
import sys
import time
import urllib.parse
import urllib.request

from bs4 import BeautifulSoup as bf
# Queue of listing pages to crawl: pages 1-10 of tag 566.
url_list = ['http://www.27270.com/tag/566_%d.html' % i for i in range(1, 11)]

# Folder that downloaded images are written to.
SAVE_DIR = 'C:\\Users\\user\\Desktop\\新建文件夹'

# Seconds to wait on a single HTTP request before giving up, so one stalled
# server cannot hang the whole crawl.
REQUEST_TIMEOUT = 30

# Characters that are not allowed in Windows file names, plus control
# whitespace that may appear inside an ``alt`` attribute.
_ILLEGAL_FILENAME_CHARS = re.compile(r'[\\/:*?"<>|\r\n\t]')


def safe_filename(name, fallback='image'):
    """Return *name* made safe for use as a file name.

    Every character matched by ``_ILLEGAL_FILENAME_CHARS`` is replaced with
    ``'_'`` and leading/trailing spaces and dots are stripped.  If nothing
    is left (or *name* is ``None``/empty), *fallback* is returned instead.
    """
    cleaned = _ILLEGAL_FILENAME_CHARS.sub('_', name or '').strip(' .')
    return cleaned or fallback


def fetch_soup(page_url):
    """Download *page_url* and return it parsed as a BeautifulSoup object.

    The response is closed as soon as the body has been read.  The parser
    is named explicitly so the result does not depend on which optional
    parsers happen to be installed.
    """
    with urllib.request.urlopen(page_url, timeout=REQUEST_TIMEOUT) as response:
        html = response.read()
    return bf(html, 'html.parser')


def collect_detail_links(soup, base_url):
    """Return the detail-page URL of every ``<li>`` in *soup* that has a link.

    For each ``<li>`` the first ``<a>`` inside it is used; items without an
    ``<a>`` or without a non-empty ``href`` are skipped.  Each ``href`` is
    resolved against *base_url* so relative links become absolute.
    """
    links = []
    for li in soup.find_all('li'):
        anchor = li.a
        href = anchor.get('href') if anchor is not None else None
        if href:
            links.append(urllib.parse.urljoin(base_url, href))
    return links


def download_first_image(detail_url, save_dir=SAVE_DIR):
    """Save the first ``<img>`` found on *detail_url* into *save_dir*.

    The file is named ``<alt>.jpg`` after sanitising the ``alt`` text; when
    ``alt`` is missing or empty, the stem of the image URL is used instead.

    Returns the path written, or ``None`` when the page has no ``<img>``
    with a ``src``.  Network and file errors propagate to the caller.
    """
    # NOTE: only the first image of each detail page is fetched; crawling
    # every large image on the page is not implemented.
    img = fetch_soup(detail_url).img
    src = img.get('src') if img is not None else None
    if not src:
        return None
    src = urllib.parse.urljoin(detail_url, src)

    url_path = urllib.parse.urlsplit(src).path
    stem = os.path.splitext(os.path.basename(url_path))[0]
    name = safe_filename(img.get('alt'), fallback=safe_filename(stem))
    target = os.path.join(save_dir, '%s.jpg' % name)

    # Read the whole body before opening the file so a failed download
    # does not leave an empty file behind.
    with urllib.request.urlopen(src, timeout=REQUEST_TIMEOUT) as response:
        data = response.read()
    with open(target, 'wb') as out:
        out.write(data)
    return target


def main():
    """Crawl every page in ``url_list`` and download one image per detail page.

    The crawl is best-effort: a failure on a listing page or on a single
    detail page is reported on stderr and the crawl moves on to the next
    item.  ``KeyboardInterrupt`` is not caught, so Ctrl-C stops the script.
    """
    os.makedirs(SAVE_DIR, exist_ok=True)
    for url in url_list:  # level 1: each listing page full of thumbnails
        try:
            links = collect_detail_links(fetch_soup(url), url)
        except Exception as exc:
            print('skipping listing page %s: %s' % (url, exc), file=sys.stderr)
            continue
        for href in links:  # level 2: the full-size page behind each thumbnail
            try:
                download_first_image(href)
            except Exception as exc:
                print('skipping image page %s: %s' % (href, exc), file=sys.stderr)


if __name__ == '__main__':
    main()
# Scraping a beauty-photo gallery with Python
# (Blog page footer: latest recommended article published 2022-05-05 20:29:47)