因为刚开始学习 Python,就写了一个简单的爬虫,爬取了一些表情包;后期还会利用 Scrapy 框架爬取小说等其他内容。
废话不多说,直接上代码:
# Import modules
import os
from urllib.parse import urljoin

import requests
from bs4 import BeautifulSoup

# Directory the downloaded images are written to
path = r'D:\斗图2'
# Listing pages are addressed as BASE_URL + page number
BASE_URL = 'http://www.bbsnet.com/page/'
# Seconds to wait on any single HTTP request before giving up
TIMEOUT = 10


def main():
    """Download the GIF images linked from listing pages 1-10 into ``path``.

    Saved files are named with a running counter that starts at 1, followed
    by the last four characters of the image URL (normally ``.gif``).
    A page or image that cannot be fetched is reported on stdout and
    skipped, so one bad URL does not abort the whole run.
    """
    # open() does not create missing directories, so make sure it exists.
    os.makedirs(path, exist_ok=True)

    # Images are numbered starting from 1
    count = 1
    # Crawl 10 pages of images
    for i in range(1, 11):
        page_url = BASE_URL + str(i)
        try:
            response = requests.get(page_url, timeout=TIMEOUT)
            response.raise_for_status()
        except requests.RequestException as err:
            print('skipping page %s: %s' % (page_url, err))
            continue
        response.encoding = 'utf-8'
        soup = BeautifulSoup(response.text, 'html.parser')

        imgs = soup.select('div > div > ul > li > div > a > img')
        for img in imgs:
            # Some <img> tags carry no src attribute at all.
            src = img.get('src')
            if not src or not src.endswith('gif'):
                continue

            # Resolve relative / protocol-relative links against the page;
            # absolute URLs pass through unchanged.
            img_url = urljoin(page_url, src)
            try:
                data = requests.get(img_url, timeout=TIMEOUT)
                # Do not save an HTML error page under a .gif name.
                data.raise_for_status()
            except requests.RequestException as err:
                print('skipping image %s: %s' % (img_url, err))
                continue

            # Build the target path: <path>/<count><last 4 chars of src>
            file_name = os.path.join(path, str(count) + src[-4:])
            # The context manager closes the file even if the write fails.
            with open(file_name, 'wb') as file:
                file.write(data.content)
            count += 1


if __name__ == '__main__':
    main()