#coding=utf8
from lxml import etree
from scrapy import *
from selenium import webdriver
#from selenium.webdriver.common.by import By
#进行编码
# import sys
# reload(sys)
# sys.setdefaultencoding('utf-8')
# Start the browser: Firefox in headless mode (PhantomJS could not be used here).
fireFoxOptions = webdriver.FirefoxOptions()
# Pass Firefox's own "-headless" switch instead of the deprecated
# set_headless() helper, which was removed in Selenium 4.
fireFoxOptions.add_argument("-headless")
# `options=` replaces the deprecated `firefox_options=` keyword.
browser = webdriver.Firefox(options=fireFoxOptions)
url = "https://news.baidu.com/news?fr=mohome&ssid=0&from=844b&uid=&pu=sz%401320_2001%2Cta%40iphone_1_10.3_3_603&bd_page_type=1#/detail/12896848575392312266"
try:
    # Send the request.
    browser.get(url)
    # Take the page markup as the browser currently holds it.
    # NOTE(review): page_source is read immediately after get(); if the article
    # body is filled in later by JavaScript, an explicit wait may be needed.
    html = browser.page_source
finally:
    # Shut the browser down even when loading fails. quit() ends the whole
    # WebDriver session, whereas close() only closes the current window.
    browser.quit()
# Extract the data: every <p> directly under the element with
# id="newsDetailContent".
S = etree.HTML(html)
L = S.xpath("//*[@id='newsDetailContent']/p")
print(L)
# Display the data: the first direct text node of each paragraph.
for paragraph in L:
    texts = paragraph.xpath("text()")
    # A <p> holding only child elements has no direct text node; skip it
    # instead of failing with IndexError on [0].
    if texts:
        print(texts[0])
from lxml import etree
from scrapy import *
from selenium import webdriver
#from selenium.webdriver.common.by import By
#进行编码
# import sys
# reload(sys)
# sys.setdefaultencoding('utf-8')
# NOTE(review): from here on the script repeats the scrape performed earlier in
# this file (same URL, same XPath), so the page is fetched and printed a second
# time. This looks like an accidental paste -- confirm and remove if so.
# Start the browser: Firefox in headless mode (PhantomJS could not be used here).
fireFoxOptions = webdriver.FirefoxOptions()
# Pass Firefox's own "-headless" switch instead of the deprecated
# set_headless() helper, which was removed in Selenium 4.
fireFoxOptions.add_argument("-headless")
# `options=` replaces the deprecated `firefox_options=` keyword.
browser = webdriver.Firefox(options=fireFoxOptions)
url = "https://news.baidu.com/news?fr=mohome&ssid=0&from=844b&uid=&pu=sz%401320_2001%2Cta%40iphone_1_10.3_3_603&bd_page_type=1#/detail/12896848575392312266"
try:
    # Send the request.
    browser.get(url)
    # Take the page markup as the browser currently holds it.
    # NOTE(review): page_source is read immediately after get(); if the article
    # body is filled in later by JavaScript, an explicit wait may be needed.
    html = browser.page_source
finally:
    # Shut the browser down even when loading fails. quit() ends the whole
    # WebDriver session, whereas close() only closes the current window.
    browser.quit()
# Extract the data: every <p> directly under the element with
# id="newsDetailContent".
S = etree.HTML(html)
L = S.xpath("//*[@id='newsDetailContent']/p")
print(L)
# Display the data: the first direct text node of each paragraph.
for paragraph in L:
    texts = paragraph.xpath("text()")
    # A <p> holding only child elements has no direct text node; skip it
    # instead of failing with IndexError on [0].
    if texts:
        print(texts[0])