1、环境
PyCharm + Selenium + pyquery + openpyxl
2、功能说明
通过 openpyxl 读取关键词，爬取亚马逊上指定关键词对应商品的信息，并将获取到的信息通过 openpyxl 写入 Excel 文件中
3、完整代码
import time
from selenium import webdriver
from selenium.webdriver.support.ui import WebDriverWait
from selenium.webdriver.support import expected_conditions as ec
from selenium.webdriver.common.desired_capabilities import DesiredCapabilities
from selenium.webdriver.common.by import By
from pyquery import PyQuery as Pq
import openpyxl
def parse_detail(page_source, page_index,key):
global write_row
isEnd = False
doc = Pq(page_source)
# 判断是否为最后一页,最后一页就停止往下获取
last = doc('.a-disabled.a-last').text()
if last.strip() != "":
isEnd = True
print("last text = ",last," isEnd = ",isEnd)
# 获取商品所有信息
main_list = doc('.s-main-slot.s-result-list.s-search-results.sg-row')
par_list = main_list.children().items()
normal_count = 0
for child in par_list:
#

最低0.47元/天 解锁文章

1059

被折叠的 条评论
为什么被折叠?



