import requests
from bs4 import BeautifulSoup
import openpyxl
# Scrape job listings for a keyword from zhaopin.com and store the company
# name, job requirements and salary of every listing in an Excel workbook.

# Search keyword and number of result pages to crawl.
keyword = '机器视觉工程师'
pages = 30

# Create the Excel workbook and worksheet.
wb = openpyxl.Workbook()
ws = wb.active
ws.title = 'Salary'

# Write the header row.
ws['A1'] = '公司名称'
ws['B1'] = '招聘条件'
ws['C1'] = '薪资待遇'

# Crawl every result page in turn.
for page in range(1, pages + 1):
    # Build the request URL for this page.
    # NOTE(review): the host is `fe-api`; confirm this endpoint really returns
    # HTML containing the class names queried below.
    url = f'https://fe-api.zhaopin.com/c/i/sou?pageSize=60&cityId=538&workExperience=-1&education=-1&companyType=-1&employmentType=-1&jobWelfareTag=-1&kw={keyword}&kt=3&=0&_v=0.83752170&x-zp-page-request-id=5d0f5a4d0c374e2c8e9a9f1f2b78d7c9-1625026694259-75501&x-zp-client-id=8a905e1c-2c14-4f5d-9b7d-1f3a05e9d3b4&pageNo={page}&suid=5d0f5a4d0c374e2c8e9a9f1f2b78d7c9&_=0'

    # Send the request. A timeout keeps one stalled connection from hanging
    # the whole crawl forever.
    response = requests.get(url, timeout=10)

    # Parse the response body.
    soup = BeautifulSoup(response.text, 'html.parser')

    # Collect the job entries on this page.
    job_list = soup.find_all('div', class_='joblist-box__item')

    # Extract the fields of each job entry.
    for job in job_list:
        company_tag = job.find('a', class_='joblist-box__body__item__info__name')
        condition_tag = job.find('div', class_='joblist-box__body__item__info__job__demand')
        salary_tag = job.find('span', class_='joblist-box__body__item__info__job__saray')

        # find() returns None when an element is absent; skip such listings
        # instead of letting a single malformed entry abort the run.
        if company_tag is None or condition_tag is None or salary_tag is None:
            continue

        company = company_tag.get('title')
        condition = condition_tag.get('title')
        # A missing `title` attribute is treated like a missing element.
        if company is None or condition is None:
            continue

        salary = salary_tag.text.strip()

        # Append the record as a new worksheet row.
        ws.append([company, condition, salary])

# Register a descending sort on the salary column. The range is derived from
# the number of rows actually written rather than a fixed 1000-row cap.
# NOTE: openpyxl only stores the filter/sort definition in the file; the rows
# stay in crawl order until a spreadsheet application applies the sort.
ws.auto_filter.ref = ws.dimensions
ws.auto_filter.add_sort_condition(f'C2:C{max(ws.max_row, 2)}', descending=True)

# Save the Excel file.
wb.save('salary.xlsx')
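# Scrape company names, job requirements and salary information from a recruitment website.
# Latest recommended article, published 2024-08-08 14:28:23.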