前言
生活索然无味,我们要留住快乐!
一、打开糗事百科热图
二、查看网页源码
代码
import os
import re

import requests
# Download every image found on pages 1-4 of the Qiushibaike image-rank
# listing and store each one under ./图片/, named after the last path
# segment of its URL.

# Browser-like User-Agent header sent with every request.
headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/86.0.4240.75 Safari/537.36'}
# Listing-page URL template; %d is replaced by the page number.
url = "https://www.qiushibaike.com/imgrank/page/%d/"
# Captures the src attribute of the <img> inside each <div class="thumb">.
# Loop-invariant, so it is defined once instead of on every page.
ex = r'<div class="thumb">.*?<img src="(.*?)" alt.*?</div>'
# Output directory for the downloaded images.
save_dir = "./图片/"
# Seconds to wait on each request, so a stalled connection cannot hang the run.
request_timeout = 10

# open() does not create missing directories, so make sure the target exists.
os.makedirs(save_dir, exist_ok=True)

for pagenum in range(1, 5):
    new_url = url % pagenum
    page = requests.get(url=new_url, headers=headers, timeout=request_timeout)
    # Fail loudly instead of silently parsing an HTTP error page.
    page.raise_for_status()
    # re.S lets '.' match newlines, since each thumb <div> spans several lines.
    img_list = re.findall(ex, page.text, re.S)
    for src in img_list:
        # The captured src is presumably protocol-relative ("//host/path");
        # only add the scheme in that case so an absolute URL is not mangled.
        img_url = "https:" + src if src.startswith("//") else src
        img_response = requests.get(url=img_url, headers=headers, timeout=request_timeout)
        if not img_response.ok:
            # Skip this image rather than saving an error body as a picture.
            continue
        filename = img_url.split('/')[-1]
        img_path = save_dir + filename
        with open(img_path, "wb") as fp:
            fp.write(img_response.content)

print("爬取成功")
运行结果