import json
import urllib
from urllib import request, parse

# Headers sent with every request; the User-Agent imitates a mobile Chrome
# browser.
headers = {
    "User-Agent": "Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.106 Mobile Safari/537.36"
}

# Seconds to wait for the server before giving up, so a stalled connection
# cannot hang the script indefinitely.
_REQUEST_TIMEOUT = 30


def _post_json(url, params):
    """POST *params* form-encoded to *url* and return the parsed JSON body.

    The response is always closed, even if reading or parsing fails.
    """
    body = urllib.parse.urlencode(params).encode('utf-8')
    req = urllib.request.Request(url, data=body, headers=headers)
    with urllib.request.urlopen(req, timeout=_REQUEST_TIMEOUT) as resp:
        return json.loads(resp.read().decode('utf-8'))


def GetPython(starurl, data):
    """Print department, work location and degree for each returned position.

    Args:
        starurl: URL of the position-list endpoint.
        data: Mapping of form fields to POST (keyword, paging, ...).

    Raises:
        urllib.error.URLError: If the request cannot be completed.
        ValueError: If the response body is not valid JSON.
        KeyError: If the response lacks one of the fields read below.
    """
    payload = _post_json(starurl, data)
    for job in payload['returnValue']['datas']:
        # Read all three fields before printing so a missing key never
        # produces a partially printed row.
        department = job['departmentName']
        location = job['workLocation']
        degree = job['degree']
        print(department, location, degree)


def GetAll(url):
    """Print department name and description of every position, page by page.

    The first page is requested to learn ``totalPage``; that same payload is
    then reused as page 1 instead of being downloaded a second time.

    Args:
        url: URL of the position-list endpoint.

    Raises:
        urllib.error.URLError: If a request cannot be completed.
        ValueError: If a response body is not valid JSON.
        KeyError: If a response lacks one of the fields read below.
    """

    def page_params(index):
        # NOTE(review): "t" looks like a fixed cache-busting token copied
        # from a browser session -- confirm whether the server checks it.
        return {
            "pageSize": "10",
            "t": "0.4097248009187844",
            "pageIndex": str(index),
        }

    first_page = _post_json(url, page_params(1))
    total_pages = int(first_page['returnValue']['totalPage'])

    for page in range(1, total_pages + 1):
        payload = first_page if page == 1 else _post_json(url, page_params(page))
        for job in payload['returnValue']['datas']:
            department = job['departmentName']
            description = job['description']
            print(department, description)


if __name__ == '__main__':
    starurl = 'https://job.alibaba.com/zhaopin/socialPositionList/doList.json'
    # Form fields for a keyword search restricted to "python" positions.
    data = {
        "pageSize": "10",
        "t": "0.5203601518784822",
        "keyWord": "python",
        "pageIndex": 1
    }
    # To list only the Python positions, call GetPython(starurl, data) instead.
    GetAll(starurl)
爬取某里社招网的 Python 岗位及全部岗位
最新推荐文章于 2022-10-07 21:50:05 发布