#环境python3.6
# 爬取APP 无忧借条
# 通过用户账号密码爬取用户个人信息(我这账号密码已打码)
# Crawler code
# coding:utf8
import hashlib
import time
import urllib3
import json
# Default request headers shared by every call in this module. Functions add
# or overwrite entries in this dict in place (e.g. the 'refer' key).
headers = {
    'Accept': ' */*',
    'Accept-Encoding': 'gzip, deflate',
    'Accept-Language': 'zh-CN,en-US;q=0.8',
    'User-Agent': 'Mozilla/5.0 (Linux; Android 6.0.1; Redmi 3S Build/MMB29M; wv) AppleWebKit/537.36 (KHTML, like Gecko) Version/4.0 Chrome/53.0.2785.49 Mobile MQQBrowser/6.2 TBS/043632 Safari/537.36 jinjiedao',
}

# Raw responses, keyed by the step that produced them.
origin_data = {}

# Fields extracted from the raw responses.
result = {}
# Suppress urllib3 warnings (called with no category argument).
urllib3.disable_warnings()

# Module-level urllib3 connection pool manager.
http = urllib3.PoolManager()
def login(phone, password):
    """Log in with a phone number and password and return the token.

    The password is MD5-hashed twice (the hex digest of the first hash is
    hashed again) and placed in the ``c_pwd`` request parameter.

    Side effects:
        * Sets ``headers['refer']`` on the shared module-level header dict.
        * Stores the login response in ``origin_data['login']``.

    Args:
        phone: Account phone number; concatenated onto a URL string, so it
            must be a ``str``.
        password: Plain-text password as a ``str``.

    Returns:
        The value stored under ``'token'`` in the login response.
    """
    # NOTE(review): the key is 'refer', not the standard HTTP 'Referer'
    # header name -- confirm this is what the server expects.
    headers['refer'] = 'https://www.gushistory.com/jjdapp/html/register/login.html?telephone=' + phone

    # Double MD5: hash the password, then hash the resulting hex string.
    first_digest = hashlib.md5(password.encode(encoding='utf-8')).hexdigest()
    hashed_password = hashlib.md5(first_digest.encode(encoding='utf-8')).hexdigest()

    # `excute` is defined elsewhere in this file; presumably it performs the
    # HTTP request and returns the decoded JSON body -- TODO confirm.
    reply = excute(
        'https://www.gushistory.com/jjdApi/user/login',
        'GET',
        {'c_telephone': phone, 'c_pwd': hashed_password},
    )
    origin_data['login'] = reply
    return reply['token']
# 获取登陆后的信息
def getAccountInfo(token):
account_url='https://www.gushistory.com/jjdApi/user/getHomepageInfo'
headers['refer'] = 'https://www.gushistory.com/jjdapp/html/index.html'
data = {'token': token}
response = excute(account_url, 'GET', data)
origin_data['account'] = response
user_info = response['userInfo']
result['balance'] = user_i