import requests
import parsel
import time
import os
# Record the program start time.
start = time.time()

# Make sure the output directory exists. exist_ok=True creates the directory
# when it is missing and does nothing when it is already there, so there is
# no window between checking for the directory and creating it.
os.makedirs('./image', exist_ok=True)
# Running count of images crawled so far.
count = 0

# Request headers: identify as a desktop Chrome browser.
headers = {
    "User-Agent": (
        "Mozilla/5.0 (Windows NT 10.0; Win64; x64) "
        "AppleWebKit/537.36 (KHTML, like Gecko) "
        "Chrome/98.0.4758.102 Safari/537.36"
    ),
}

# Listing-page URL template; the {0} placeholder is filled via str.format.
url = "https://fabiaoqing.com/biaoqing/lists/page/{0}.html"
# Walk listing pages 1 through 5 and, for every ".tagbqppdiv" element on a page,
# read the title and data-original attributes of its lazy-loaded <img>.
# NOTE(review): the bodies of both loops have lost their indentation in this copy
# and the inner loop continues past this excerpt — restore the nesting before running.
for i in range(1,6):
url_i = url.format(i) # build the URL for page i
response = requests.get(url=url_i,headers=headers).text # request the page and keep the response body as text
sel = parsel.Selector(response) # parse the page text
divs = sel.css(".tagbqppdiv") # select every element with class "tagbqppdiv"
for div in divs:
title = div.css("img.ui.image.lazy::attr(title)").get() # title attribute; per the original comment, used as the file name
img_url = div.css("img.ui.image.lazy::attr(data-original)").get() # data-original attribute, i.e. the image URL
suffix = img_u
使用 requests 请求、parsel 解析,爬取网络表情包
最新推荐文章于 2024-06-17 17:35:06 发布