======================1.爬取抽屉网信息(json数据)==========================
# Fetch the "top ten" JSON feed from dig.chouti.com and print its data payload.
#
# Don't reinvent the wheel -- look for an existing package first:
#   pip search <package name>
#   pip install fake_useragent
import json

import requests
from fake_useragent import UserAgent

# Kept from the original script. The request below sends a fixed User-Agent
# string and does not read this object.
agent = UserAgent()

url = "https://dig.chouti.com/getTopTenLinksOrComments.json?_=1529764992551"

# Original author's note: requests issued by a browser are usually GET requests.
# NOTE(review): the call below nevertheless uses POST, as in the original
# script -- confirm which method the endpoint actually expects.
headers = {
    "Host": "dig.chouti.com",
    "User-Agent": "Mozilla/5.0 (Windows NT 6.1; WOW64; rv:53.0) Gecko/20100101 Firefox/53.0",
    "Accept": "application/json,text/javascript,*/*; q=0.01",
    "Accept-Language": "zh-CN,zh;q=0.8,en-US;q=0.5,en;q=0.3",
    # "br" is deliberately not advertised: Requests can only decode Brotli
    # when an optional brotli package is installed; without it the body would
    # arrive still compressed and json.loads() below would fail.
    "Accept-Encoding": "gzip,deflate",
    "X-Requested-With": "XMLHttpRequest",
    "Referer": "https://dig.chouti.com/",
    # NOTE(review): hard-coded cookie values, presumably captured from a
    # browser session -- they may have expired; confirm before relying on them.
    "Cookie": "gpsd=0b08b9f5b945fd53eac7868a2e8945a8;JSESSIONID=aaazCSOWV2s7FcALFeHqw;gpid=55eaeb947f15445b82467624c476521f;_pk_id.1.a2d5=dbeb24b52f36519f.1529741245.1.1529741290.1529741245.;_pk_ses.1.a2d5=*",
    "Connection": "keep-alive",
}
data = {"_": "1529742010062"}

# Requests applies no timeout by default; without one a stalled connection
# would block this script indefinitely.
res = requests.post(url, headers=headers, data=data, timeout=10)
# Fail loudly on an HTTP error status instead of trying to parse an error page.
res.raise_for_status()

rs_js = json.loads(res.content)
print(rs_js['result']['data'])