一个简单的用chromedriver实现自动登录并且破解登录验证码的例子

最新推荐文章于 2024-06-02 20:55:15 发布

yangbenhao

最新推荐文章于 2024-06-02 20:55:15 发布

阅读量3.9k

点赞数

分类专栏：python爬虫小程序 | 文章标签：登录打码

本文链接：https://blog.csdn.net/yangbenhao/article/details/81937842

版权

python爬虫小程序专栏收录该内容

2 篇文章 0 订阅

订阅专栏

from selenium import webdriver
import time
import requests
from lxml import etree
import base64
#操作浏览器
def getheaders():
    """Log in to Douban through Chrome and build headers for ``requests``.

    Opens the login page in a Chrome instance, types the account name and
    password, solves the captcha through the coding platform when the page
    shows one, submits the form and converts the browser cookies into a
    ``Cookie`` header.

    Returns:
        dict: headers with a ``User-Agent`` and the ``Cookie`` string built
        from the browser session, ready to pass to ``requests.get``.
    """
    driver = webdriver.Chrome()
    try:
        # Login page to visit.
        login_url = 'https://accounts.douban.com/login?alias=&redir=https%3A%2F%2Fwww.douban.com%2F&source=index_nav&error=1001'
        time.sleep(2)
        driver.get(login_url)
        time.sleep(2)

        # Fill in the account name and password.
        driver.find_element_by_id('email').send_keys('******')
        driver.find_element_by_id('password').send_keys('******')

        # Best effort: a failed captcha step must not abort the login attempt.
        _fill_captcha(driver)

        # Submit the login form.
        driver.find_element_by_class_name('btn-submit').click()

        # Cookies of the browser session after submitting the form.
        cookies = driver.get_cookies()
        print(cookies)
    finally:
        # The browser is only needed to obtain the cookies; always close it
        # so the Chrome process does not leak, even when a step above fails.
        driver.quit()

    # Return the headers: the caller passes them straight to requests.get.
    return {
        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.106 Safari/537.36',
        'Cookie': _cookie_header(cookies),
    }


def _fill_captcha(driver):
    """Type the captcha text into the login form if the page shows a captcha."""
    try:
        # Locate the captcha image with XPath on the rendered page source.
        page = etree.HTML(driver.page_source)
        image_srcs = page.xpath('//img[@id="captcha_image"]/@src')
        if not image_srcs:
            # No captcha image on the page: nothing to solve.
            print('don`t need')
            return

        # Download the image and base64-encode it for the coding platform.
        image = requests.get(image_srcs[0])
        form = {
            'v_pic': base64.b64encode(image.content),
            'v_type': 'cn',
        }
        # Authorization header of the coding platform.
        solver_headers = {
            'Authorization': 'APPCODE 5c3fb1*****2c6b7e297cc7'
        }
        # Submission address of the Alibaba Cloud coding service.
        solver_url = 'http://yzmplus.market.alicloudapi.com/fzyzm'
        reply = requests.post(solver_url, data=form, headers=solver_headers)
        res_vcode = reply.json()['v_code']
        print(res_vcode)

        # Type the recognized text into the captcha field.
        driver.find_element_by_id('captcha_field').send_keys(res_vcode)
    except Exception as exc:
        # Keep the original best-effort behavior, but report the real reason
        # instead of pretending no captcha was required.
        print('captcha step failed:', exc)


def _cookie_header(cookies):
    """Join cookie dicts (with 'name' and 'value' keys) into a Cookie header value."""
    return ';'.join(item['name'] + '=' + item['value'] for item in cookies)

if __name__ == '__main__':
    # Run the browser login and take whatever headers it hands back.
    headers = getheaders()

    # URL of a page that is shown after logging in.
    url_info = 'https://www.douban.com/people/183367314/'
    page = requests.get(url_info, headers=headers)

    # Dump the raw response body to disk for inspection.
    out_file = open('douban.html', 'wb')
    with out_file:
        out_file.write(page.content)

yangbenhao

关注

0
点赞
踩
2

收藏

觉得还不错? 一键收藏
0
评论
一个简单的用chromedriver实现自动登录并且破解登录验证码的例子

from selenium import webdriverimport timeimport requestsfrom lxml import etreeimport base64#操作浏览器def getheaders(): driver = webdriver.Chrome() #这是要访问的网站 url = 'https://accounts.douba...
复制链接

扫一扫