import urllib.request import os import pyexcel_xls from bs4 import BeautifulSoup def crawler(url): headers = { "Accept": "application/json, text/javascript, */*; q=0.01", "X-Requested-With": "XMLHttpRequest", "User-Agent": "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/59.0.3071.115 Safari/537.36", "Content-Type": "application/x-www-form-urlencoded; charset=UTF-8" } headersurl=urllib.request.Request(url,headers=headers) dataopen=urllib.request.urlopen(headersurl) #利用BeautifulSoup来分析数据 bsoup=BeautifulSoup(dataopen,"html.parser") datas=bsoup.find_all("div",{"class":"card-box"}) biglist=[] for x in datas: title=x.find("div",{"class":"card-img"}).find("a").get("title") titleimg=x.find(&#
Python爬虫利用BeautifulSoup获取站酷图片网站的全部内容
最新推荐文章于 2022-05-23 21:01:48 发布