想必现在这种验证码越来越多了,但对机器而言,同样可以秒级攻破,和其他验证码并无区别,只需要高质量的样本即可。
图一实测结果:
图三实测结果:
老样子,送一波采集代码(图一):
from utils import Project, ProxyType, ServiceType
class So(Project):
    """Captcha collector for the 360 Search (so.com) anti-spider page.

    Downloads captcha images from ``captcha_url`` and submits candidate
    answers to ``feedback_url`` to find out whether they were accepted.
    ``self.session`` is not defined in this class; presumably it is
    provided by ``Project`` -- confirm against ``utils``.
    """

    def __init__(self):
        """Initialise the base project and set the so.com endpoints."""
        super().__init__()
        # NOTE(review): the meaning of Local19962 lives in utils.ServiceType;
        # presumably it selects a locally hosted recognition service -- confirm.
        self.service_type = ServiceType.Local19962
        self.captcha_url = "https://www.so.com/index.php?c=index&a=getcode"
        self.feedback_url = "https://www.so.com/index/antispider"

    def captcha_process(self) -> bytes:
        """Fetch one captcha and return the raw response body.

        The request uses a 1-second timeout. The HTTP status is not
        inspected, so whatever body the server sends back is returned.
        """
        return self.session.get(self.captcha_url, timeout=1).content

    def feedback_process(self, captcha_text: str) -> bool:
        """Submit ``captcha_text`` and report whether the prompt went away.

        Args:
            captcha_text: Candidate answer, sent as the ``rcode`` form field.

        Returns:
            ``False`` when the response page still contains the prompt
            "请输入以下验证码继续使用360搜索" ("please enter the captcha below
            to continue using 360 Search"); ``True`` otherwise.
        """
        print(captcha_text)
        # NOTE(review): the "from" value is already percent-encoded and is
        # passed through ``data=``, which form-encodes it again -- confirm
        # this is what the endpoint expects before changing it.
        form = {
            "from": "http%3A%2F%2Fwww.so.com%2Fs%3Fq%3Djkjk%26src%3Dsrp%26fr%3Dnone%26psid%3Dfc12b9a1e9f5464ec8a9b37ec358a0db",
            "rcode": captcha_text,
        }
        response = self.session.post(self.feedback_url, data=form, timeout=1)
        # Force the decoding used for ``response.text`` below.
        response.encoding = "utf8"
        return '请输入以下验证码继续使用360搜索' not in response.text
if __name__ == '__main__':
    # Script entry point: build the collector, configure it, then run it.
    collector = So()
    # No proxy; ``save_false=True`` is forwarded as-is (presumably keeps
    # samples whose feedback was False -- confirm in utils.Project).
    collector.configuration(proxy=ProxyType.none, save_false=True)
    collector.start(num=500_000)
作者QQ:27009583