# First post on CSDN; hoping to keep writing more from here on.
import requests
import json
import pandas as pd
def _parse_jsonp(text):
    """Return the JSON object embedded in a JSONP (or plain JSON) body.

    The payload is taken from the first ``{`` to the last ``}`` so the result
    does not depend on the exact length of the callback wrapper around it.

    Raises:
        json.JSONDecodeError: if no JSON object can be found or parsed.
    """
    start = text.find('{')
    end = text.rfind('}')
    if start == -1 or end < start:
        raise json.JSONDecodeError('no JSON object found in response', text, 0)
    return json.loads(text[start:end + 1])


def listname(iname, *, max_pages=100, timeout=10):
    """Collect records for ``iname`` from the Baidu open-data endpoint.

    Sends up to ``max_pages`` GET requests (resource id ``6899``, query
    ``失信被执行人名单``), advancing ``pn`` by 10 per request with ``rn`` fixed
    at 10, and gathers the ``iname``, ``cardNum`` and ``areaName`` fields of
    every entry found under ``data[*].result``.

    Args:
        iname: Name to search for; sent as the ``iname`` query parameter.
        max_pages: Number of requests to issue. Defaults to 100, the value
            that used to be hard-coded.
        timeout: Seconds passed to ``requests.get`` so a stalled connection
            cannot block forever.

    Returns:
        A ``pandas.DataFrame`` with columns ``Name``, ``IDcard`` and ``Area``,
        de-duplicated and re-indexed from 0. It is empty when nothing was
        collected.

    Raises:
        requests.RequestException: on network failure or timeout.
        json.JSONDecodeError: if a response body holds no parsable JSON.
        KeyError: if a response lacks one of the expected keys.
    """
    # Request constants do not change between pages, so build them once.
    url = 'https://sp0.baidu.com/8aQDcjqpAAV3otqbppnN2DJv/api.php'
    headers = {
        "Host": "sp0.baidu.com",
        "Accept": "*/*",
        "Connection": "keep-alive",
        "Accept-Encoding": "gzip, deflate, br",
        'Accept-Language': 'zh-CN,zh;q=0.8',
        'Referer': 'https://www.baidu.com/s?wd=%E5%A4%B1%E4%BF%A1%E4%BA%BA',
        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.75 Safari/537.36',
    }

    names = []
    card_nums = []
    area_names = []

    for page in range(max_pages):
        params = {
            'pn': str(page * 10),
            'resource_id': '6899',
            'query': '失信被执行人名单',
            'iname': iname,
            'rn': '10',
            'ie': 'utf-8',
            'oe': 'utf-8',
            'format': 'json',
            # NOTE(review): the value itself starts with "cb="; kept exactly
            # as it was because the server's handling of it is not visible
            # from here -- TODO confirm against a live response.
            'cb': 'cb=jQuery110204669623007201096_1546820149157',
        }
        response = requests.get(
            url, headers=headers, params=params, timeout=timeout
        )
        payload = _parse_jsonp(response.content.decode())

        for entry in payload['data']:
            for record in entry['result']:
                names.append(record['iname'])
                card_nums.append(record['cardNum'])
                area_names.append(record['areaName'])

    # Use the names returned by the service, not the search term: the old
    # code filled every row of the Name column with the query string.
    frame = pd.DataFrame(
        {'Name': names, 'IDcard': card_nums, 'Area': area_names}
    )
    return frame.drop_duplicates().reset_index(drop=True)
# Example run: look up the placeholder name 'XXX' and print the resulting table.
print(listname('XXX'))