这是第三天爬取的一个案例。请注意:cookie 过期后代码将无法正常运行,届时请自行替换为有效的 cookie;截至目前,这段代码可以成功运行。
代码如下:
# 加入延时以防止 IP 被封,同时将结果写入 CSV 文件
import requests
import time,csv,pprint,re,json
# Base request URL. The `query` parameter is the percent-encoded UTF-8 text
# "Web前端" ("Web front-end").
# Example of the same URL with a `page` parameter appended (page 4):
# https://www.zhipin.com/c100010000/?query=Web%E5%89%8D%E7%AB%AF&page=4
url = "https://www.zhipin.com/c100010000/?query=Web%E5%89%8D%E7%AB%AF"
cookie_str = "lastCity=101280100; __c=1579014251; __g=-; Hm_lvt_194df3105ad7148dcf2b98a91b5e727a=1578649034,1578765623,1579014251; __l=l=%2Fwww.zhipin.com%2Fguangzhou%2F&r=https%3A%2F%2Fcn.bing.com%2F&friend_source=0&friend_source=0; __a=58611270.1578649034.1578765623.1579014251.48.3.4.48; Hm_lpvt_194df3105ad7148dcf2b98a91b5e727a=1579014289; __zp_stoken__=9af4tzqlX58fbH%2Bf%2BsKBO%2ByL6anOmthiJ48g04bm4JIOvKd1PXCwoRlNJy0uVQIfwBjvkXSjsL1CbtGIyRY%2FSB7o98c8vMTZRvd3zeXK7Db2qjIEDsJQJl%2FbBjSKMCSZw6lI; __zp_sseed__=23gHsZTrFQC+PcxKy/4q0mEX