我去爬了智联招聘的网站,但是用下面这段代码爬到第10页的时候,就得不到职位网址了:
import logging
import re

import requests
from bs4 import BeautifulSoup  # noqa: F401  (unused here; kept from the original import list)

logger = logging.getLogger(__name__)

# Search-result URL with a percent-encoded keyword; the page number is
# appended after the trailing "p=".
url = "http://sou.zhaopin.com/jobs/searchresult.ashx?kw=%E7%BD%91%E7%BB%9C%E5%B7%A5%E7%A8%8B%E5%B8%88&sm=0&sg=78e9eafcaf414ca294d30b64548bf27d&p="

# Result pages to crawl: 1..89 (the original iterated list(range(90))[1:]).
PAGE_NUMBERS = range(1, 90)

# Job-detail links: a 15-digit id followed by ".htm". The dots are escaped so
# they match a literal "." only.
JOB_URL_PATTERN = re.compile(r"http://jobs\.zhaopin\.com/\d{15}\.htm")

# Not used by the code in this script; kept because the original defined it.
unlion = []


def getHttp(url, timeout=10):
    """Fetch *url* and return the response body as text.

    Args:
        url: Address to request.
        timeout: Seconds to wait for the server before giving up. Without a
            timeout ``requests`` may block indefinitely.

    Returns:
        The decoded page text, or ``""`` if the request failed (connection
        error, timeout, or HTTP error status). Failures are logged so that an
        empty result can be told apart from a page with no matches.
    """
    headers = {'User-Agent': 'Google/10.0'}
    try:
        response = requests.get(url, headers=headers, timeout=timeout)
        response.raise_for_status()
    except requests.RequestException as exc:
        logger.warning("request for %s failed: %s", url, exc)
        return ""
    # Decode using the encoding detected from the body rather than the one
    # declared in the HTTP headers.
    response.encoding = response.apparent_encoding
    return response.text


def geturl(demo, list):
    """Print every job-detail URL found in the page text *demo*.

    Args:
        demo: Page content; converted with ``str()`` before matching.
        list: Unused. Kept (including its builtin-shadowing name) so existing
            positional and keyword callers keep working.
    """
    for job_url in JOB_URL_PATTERN.findall(str(demo)):
        print(job_url)


def main():
    """Crawl each result page in PAGE_NUMBERS and print the job URLs on it."""
    for page in PAGE_NUMBERS:
        page_url = url + str(page)
        print(page_url, page)
        geturl(getHttp(page_url), PAGE_NUMBERS)


if __name__ == "__main__":
    main()
修改