Python爬虫:验证码识别登录
获取验证码图片
import requests
from lxml import etree
# Download the captcha image shown on the gushiwen login page and save it
# to ./code.jpg so it can be passed to a recognition service afterwards.
url = 'https://so.gushiwen.org/user/login.aspx?from='
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/89.0.4389.90 Safari/537.36',
}

# An explicit timeout keeps the script from hanging forever on a stalled
# connection; raise_for_status() surfaces HTTP errors instead of silently
# parsing an error page.
login_page = requests.get(url=url, headers=headers, timeout=10)
login_page.raise_for_status()
img_code_text = login_page.text

# The captcha <img> carries id="imgCode"; its src is appended to the site
# root below, exactly as before.
tree = etree.HTML(img_code_text)
img_src_list = tree.xpath('//*[@id="imgCode"]/@src')
if not img_src_list:
    # Same exception type the bare [0] lookup would raise, but with a
    # message that explains what is actually missing.
    raise IndexError('captcha element with id="imgCode" not found on the login page')
img_src_url = 'https://so.gushiwen.org' + img_src_list[0]

# NOTE(review): the captcha is presumably bound to the server-side session
# cookie; if a later login request must match this image, all requests should
# go through one shared requests.Session -- confirm against the login code.
img_response = requests.get(url=img_src_url, headers=headers, timeout=10)
img_response.raise_for_status()
img_data = img_response.content

# Write the raw image bytes; binary mode avoids any text encoding step.
with open('./code.jpg', 'wb') as fp:
    fp.write(img_data)
超级鹰平台识别验证码图片
登录超级鹰官网,注册账号并设置密码,然后在“用户中心 >> 软件ID”页面生成一个软件ID。
#!/usr/bin/env python
# coding:utf-8
import requests
from hashlib import md5
class Chaojiying_Client(object):
def __init__(self, username, password, soft_id):
self.username = username
#更改点1
password = password.encode('utf-8')
self.password = md5(password).hexdigest()
self.soft_id = soft_id
self.base_params = {
'user': self.username,
'pass2': self.password,
'softid&#