# -*- coding: UTF-8 -*-
from selenium.common.exceptions import TimeoutException, NoSuchElementException, WebDriverException
from selenium.webdriver.common.by import By
from selenium.webdriver.support import expected_conditions as EC
from selenium.webdriver.support.wait import WebDriverWait
from selenium.webdriver.common.keys import Keys
from selenium import webdriver
from bs4 import BeautifulSoup
import urllib.request
import io
import json
import os
import requests
import sys
# Use selenium to simulate browser behavior: open Chrome, load the news home page, enter the keyword, click, then look for the next page
# import chardet
import re
def test_sel(keyword):
driver = webdriver.Chrome()
link = 'http://news.baidu.com/?tn=news'
driver.get(link)
try:
WebDriverWait(driver, 30).until(
EC.presence_of_element_located((By.ID, "ww"))
)
except TimeoutException:
print ('加载页面失败')
try:
element = driver.find_element
用selenium爬取百度新闻
最新推荐文章于 2024-07-01 11:04:11 发布
![](https://img-home.csdnimg.cn/images/20240711042549.png)