import os

import requests
from bs4 import BeautifulSoup
# Request headers sent with page fetches; the User-Agent string identifies
# the client as desktop Chrome 70 on 64-bit Windows 10.
headers = {
    'User-Agent': (
        'Mozilla/5.0 (Windows NT 10.0; Win64; x64) '
        'AppleWebKit/537.36 (KHTML, like Gecko) '
        'Chrome/70.0.3538.102 Safari/537.36'
    ),
}
def download_one(url, I, timeout=10):
    """Save the image shown on one gallery page and return the page's first link.

    The page at ``url`` is fetched and decoded as GBK. Inside the first
    ``<div class="articleV4Body">`` the first ``<img>`` supplies the image
    URL and the first ``<a>`` supplies the returned ``href`` (the caller
    treats it as the file name of the next page). The image bytes are written
    to ``图片/<I>.jpg``; the directory is created when it does not exist.

    Args:
        url: Absolute URL of the gallery page to scrape.
        I: Value used as the base name of the saved ``.jpg`` file.
        timeout: Seconds to wait on each HTTP request before giving up.

    Returns:
        The ``href`` attribute of the first ``<a>`` inside the article body.

    Raises:
        requests.RequestException: On network failure, timeout, or a 4xx/5xx
            response for either the page or the image.
        UnicodeDecodeError: If the page body is not valid GBK.
        IndexError: If the article div, the image, or the link is missing.
        KeyError: If the image has no ``src`` or the link has no ``href``.
    """
    response = requests.get(url, headers=headers, timeout=timeout)
    # Fail fast on an HTTP error instead of parsing an error page.
    response.raise_for_status()
    text = response.content.decode('gbk')
    soup = BeautifulSoup(text, 'lxml')

    div = soup.find_all(name='div', attrs={'class': 'articleV4Body'})[0]
    img = div.find_all('img')[0]
    lianjie = img['src']
    next_url = div.find_all('a')[0]['href']
    print(next_url)

    # Send the same headers as for the page request, and verify the status so
    # an error body is never written to disk as a .jpg.
    R = requests.get(lianjie, headers=headers, timeout=timeout)
    R.raise_for_status()

    # open() does not create missing directories.
    os.makedirs('图片', exist_ok=True)
    with open('图片/{}.jpg'.format(I), 'wb') as f:
        f.write(R.content)
    return next_url
if __name__ == '__main__':
    # Walk the gallery page by page, starting at the first page, saving one
    # numbered image per page. The walk ends when a page's link points back
    # at the page that was just downloaded.
    base_url = 'https://www.27270.com/beautiful/beijingtupian/2018/'
    current_page = '313727_1.html'
    image_index = 0
    while True:
        following_page = download_one(base_url + current_page, image_index)
        image_index += 1
        if following_page == current_page:
            break
        current_page = following_page
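# 爬取27270壁纸 (Scrape wallpapers from 27270.com)
# 最新推荐文章于 2022-10-25 21:47:39 发布 (page metadata: latest recommended article published 2022-10-25 21:47:39)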