Python 爬取表情包
需求:爬取前 2 页表情包,网址是:https://www.fabiaoqing.com/biaoqing
上代码
import re  # regular expressions, used to sanitise file names
from pathlib import Path, PurePosixPath
from urllib.parse import urlsplit

import parsel  # HTML parsing
import requests  # HTTP requests

# Example listing page: https://www.fabiaoqing.com/biaoqing/lists/page/2.html
# Listing pages are numbered from 1: .../lists/page/1.html, .../lists/page/2.html, ...
PAGE_URL_TEMPLATE = 'https://www.fabiaoqing.com/biaoqing/lists/page/{page}.html'

# Sent with every request (listing pages and image downloads alike).
HEADERS = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/103.0.0.0 Safari/537.36'
}

# Directory the images are written to, relative to the working directory.
OUTPUT_DIR = Path('图片')

# Seconds to wait for a server before giving up on a request.
REQUEST_TIMEOUT = 10

# Characters Windows forbids in file names (including the backslash) plus
# ASCII control characters such as newlines.
ILLEGAL_FILENAME_CHARS = re.compile(r'[\\/:*?"<>|\x00-\x1f]')


def sanitize_title(title: str) -> str:
    """Return *title* with characters that are unsafe in file names removed."""
    return ILLEGAL_FILENAME_CHARS.sub('', title).strip()


def image_filename(title: str, img_url: str) -> str:
    """Build the file name under which the image at *img_url* is saved.

    The name is the sanitised *title* followed by the extension found in the
    URL's path (query strings and fragments are ignored). If nothing is left
    of the title after sanitising, the last path segment of the URL is used
    as the name instead so the file does not end up as a bare extension.
    """
    url_path = PurePosixPath(urlsplit(img_url).path)
    stem = sanitize_title(title) or url_path.stem
    return stem + url_path.suffix


def scrape_page(page: int, output_dir: Path = OUTPUT_DIR) -> None:
    """Download every image listed on listing page number *page*.

    Raises:
        requests.RequestException: if the listing page itself cannot be
            fetched. Failures of individual images are reported and skipped.
    """
    url = PAGE_URL_TEMPLATE.format(page=page)
    response = requests.get(url=url, headers=HEADERS, timeout=REQUEST_TIMEOUT)
    response.raise_for_status()
    selector = parsel.Selector(response.text)

    # Read both attributes from the same <img> element so that a missing
    # attribute on one image cannot shift titles against URLs.
    for img in selector.css('.tagbqppdiv img'):
        img_url = img.xpath('@data-original').get()
        if not img_url:
            continue
        title = sanitize_title(img.xpath('@title').get() or '')

        try:
            img_response = requests.get(
                url=img_url, headers=HEADERS, timeout=REQUEST_TIMEOUT
            )
            img_response.raise_for_status()
        except requests.RequestException as exc:
            # One broken image should not abort the rest of the page.
            print(f'skipped {img_url}: {exc}')
            continue

        target = output_dir / image_filename(title, img_url)
        target.write_bytes(img_response.content)
        print(title, img_url)


def main(first_page: int = 1, last_page: int = 2) -> None:
    """Scrape listing pages *first_page* through *last_page* (inclusive)."""
    # open()/write_bytes() do not create missing directories.
    OUTPUT_DIR.mkdir(parents=True, exist_ok=True)
    for page in range(first_page, last_page + 1):
        try:
            scrape_page(page)
        except requests.RequestException as exc:
            print(f'skipped page {page}: {exc}')


if __name__ == '__main__':
    main()