import random
import time

from selenium import webdriver
from selenium.webdriver.common.by import By
# Page opened first; the search is submitted from its search box.
SEARCH_URL = 'https://www.jd.com'
# Text typed into the search box.
SEARCH_KEYWORD = '无人机'
# Number of result pages to walk through.
PAGE_COUNT = 5
# Number of scroll-to-bottom passes performed on each result page.
SCROLLS_PER_PAGE = 5


def _scroll_to_bottom(driver, times=SCROLLS_PER_PAGE):
    """Scroll the window to the bottom of the document ``times`` times.

    Sleeps a random 1-2 seconds after each scroll. Presumably the repeated
    scrolling lets content that is appended while scrolling finish loading
    before the items are read -- confirm against the live page.
    """
    for _ in range(times):
        driver.execute_script('window.scrollTo(0,document.body.scrollHeight);')
        time.sleep(random.random() + 1)


def _print_item(info):
    """Print title, price, shop name and comment count of one product element.

    ``info`` is the WebElement of a single search result. Each lookup raises
    selenium's NoSuchElementException if the sub-element is missing.
    """
    # Product title
    title = info.find_element(By.CSS_SELECTOR, '.p-name.p-name-type-2 a').text.strip()
    print('title:', title)
    # Product price
    price = info.find_element(By.CSS_SELECTOR, 'div.p-price > strong > i').text.strip()
    print('price:', price)
    # Shop name
    shop = info.find_element(By.CSS_SELECTOR, 'span.J_im_icon > a').text.strip()
    print('shop:', shop)
    # Number of comments / reviews
    comments = info.find_element(By.CSS_SELECTOR, 'div.p-commit > strong > a').text.strip()
    print('comments:', comments)
    print('=' * 200)


def main():
    """Search for SEARCH_KEYWORD and print the products of PAGE_COUNT result pages."""
    # Open the browser and load the start page.
    driver = webdriver.Chrome()
    try:
        driver.get(SEARCH_URL)
        # Search input box
        tb_input = driver.find_element(By.CSS_SELECTOR, '#key')
        # Search button
        search_btn = driver.find_element(By.CSS_SELECTOR, '.button')
        # Type the search term, pause briefly, then submit.
        tb_input.send_keys(SEARCH_KEYWORD)
        time.sleep(2)
        search_btn.click()

        for _ in range(PAGE_COUNT):
            # Simulate dragging the scroll bar to the bottom of the page.
            _scroll_to_bottom(driver)
            # find_elements (plural) returns a list, so the loop below is valid.
            # NOTE(review): the original selector was '.gl_item'; the hyphenated
            # form matches the naming of the other selectors here -- confirm
            # against the live page.
            for info in driver.find_elements(By.CSS_SELECTOR, '.gl-item'):
                _print_item(info)
            # Go to the next page after a short random pause.
            time.sleep(random.random() * 2)
            driver.find_element(By.CSS_SELECTOR, 'a.pn-next').click()
    finally:
        # quit() ends the whole browser session even when a lookup above raised.
        driver.quit()


if __name__ == '__main__':
    main()