主要逻辑
1. 打开首页
2. 搜索关键字,进入第一页
   2.1 获取详情页 url
   2.2 进入详情页抓取数据
3. 翻页,重复第二步
详细代码
from selenium import webdriver
from selenium.webdriver.common.keys import Keys
from bs4 import BeautifulSoup as bs
import time
class ZhiPin:
def __init__(self):
    """Set up the crawler: record the site's home URL and launch Chrome.

    Creating an instance starts a Chrome session through Selenium; the
    home page itself is not opened here.
    """
    # Entry page of the target site; only stored at this point.
    self.start_url = 'https://www.zhipin.com/'
    # Browser session handle that the other methods (e.g. ``search``)
    # drive to locate elements and send keystrokes.
    self.driver = webdriver.Chrome()
def search(self, kw):
element = self.driver.find_element_by_class_name('ipt-search')
element.send_keys(kw)
element.send_keys(Keys.RETURN)
self.driver.find_element_by_link_text('全国')