# 饿了么外卖网站是一个 AJAX 动态加载的网站。
# Version 1:直接页面提取
import sys
import time

from lxml import etree
import requests

# Python 2 only: reload(sys) re-exposes sys.setdefaultencoding(), which is
# then used to make UTF-8 the process-wide default string encoding.
# Neither the builtin reload() nor sys.setdefaultencoding() exists on
# Python 3, so the step is skipped there.
if sys.version_info[0] == 2:
    reload(sys)
    sys.setdefaultencoding('utf-8')

# Restaurant listing page for one fixed location (latitude/longitude are
# hard-coded in the query string).
url = 'https://www.ele.me/place/ws101hcw982?latitude=22.52721&longitude=113.95232'
response = requests.get(url)
print(response.status_code)

# NOTE(review): this pause runs after the response has already been
# received, so it cannot change what is in response.content -- confirm
# whether it is meant as rate limiting or can be dropped.
time.sleep(10)

# Parse the raw response bytes into an lxml element tree.
html = response.content
selector = etree.HTML(html)

# Select every element whose class attribute is exactly
# "place-rstbox clearfix".
rez = selector.xpath('//*[@class="place-rstbox clearfix"]')

# The original author's note records that this prints an empty list ([]),
# presumably because the listing is filled in by AJAX after page load and is
# absent from the static HTML -- TODO confirm.
# Formatted as one string so the output is identical on Python 2 and 3.
print('haha %s' % (rez,))
for i inrez:
Name= i.xpath('//*[@class="rstblock-title"]/text()')printname
msales= i.xpath('//*[@class="rstblock-monthsales"]/text()')
tip= i.xpath('//*[@class="rstblock-cost"]/text()')
stime= i.xpath('//*[@class="rstblock-logo"]/span/text