playwright+opencv 过滑块拼图验证码

肆拾書時

已于 2024-07-01 16:27:18 修改

阅读量1.5k

点赞数 1

文章标签： opencv 人工智能计算机视觉

于 2023-07-14 17:14:21 首次发布

本文链接：https://blog.csdn.net/chenhens/article/details/131728108

版权

本文介绍了如何结合Python的Playwright框架和OpenCV库来自动化处理浏览器中的拼图验证码。通过图像处理技术，如边缘检测和形状匹配，定位并识别验证码图像，从而实现模拟登录过程中的拼图验证。虽然目前的识别率尚可，但提高边缘检测的准确度仍是优化的重点。

摘要由CSDN通过智能技术生成

前言

最近看到浏览器自动化框架playwright，就使用了一下
在模拟登录掘金是通过密码登陆时遇到需要通过拼图验证码

于是通过查找发现可以通过opencv库解决问题下面是解决过程

过程

1.首先需要获取到图片，通过查看html可以很容易找到需要的图片

2.通过opencv进行图像处理来获取到拼图所处的位置

1.通过查找搜索了解到可以通过边缘检测和形状匹配获取到拼图所处的位置，代码如下

import cv2

image1 = cv2.imread("resources/t4.jpeg")
image1_resize = cv2.resize(image1, (340, 212))
image2 = cv2.imread("resources/t4.png")
image2_resize = cv2.resize(image2, (68, 68))

# 背景图
# 处理图像，保留大部分白色
ret, thresholded_image = cv2.threshold(image1_resize, 220, 255, cv2.THRESH_BINARY)
# 灰度图像
gray_image1 = cv2.cvtColor(thresholded_image, cv2.COLOR_BGR2GRAY)
# 提高对比度
denoised_image1 = cv2.equalizeHist(gray_image1)
# 边缘检测
edges = cv2.Canny(denoised_image1, threshold1=500, threshold2=900)

# 滑块图片
gray_image2 = cv2.cvtColor(image2_resize, cv2.COLOR_BGR2GRAY)
denoised_image2 = cv2.equalizeHist(gray_image2)
edges2 = cv2.Canny(denoised_image2, threshold1=650, threshold2=900)

# 进行形状匹配
result = cv2.matchTemplate(edges, edges2, cv2.TM_CCOEFF_NORMED)
min_val, max_val, min_loc, max_loc = cv2.minMaxLoc(result)
top_left2 = max_loc
bottom_right2 = (top_left2[0] + edges2.shape[1], top_left2[1] + edges2.shape[0])

# 在输入图像上绘制矩形标记
cv2.rectangle(image1_resize, top_left2, bottom_right2, (0, 0, 255), 2)

cv2.imshow("denoised_image2", denoised_image2)
cv2.imshow("edges2", edges2)
cv2.imshow("denoised_image1", denoised_image1)
cv2.imshow("edges", edges)
cv2.imshow('Target Image', image1_resize)


cv2.waitKey(0)

2.分析过程

首先灰度处理图像
cv2.cvtColor(thresholded_image, cv2.COLOR_BGR2GRAY)

其次对图像进行边缘检测
cv2.Canny(denoised_image1, threshold1=500, threshold2=900)

可以看到提取到了拼图的形状
最后通过cv2.matchTemplate(edges, edges2, cv2.TM_CCOEFF_NORMED)进行形状匹配

通过上述操作就可以大致获取到拼图所处的位置
3.总结
感觉以上内容主要难点是如何提高边缘检测的准确度，更好的显示拼图形状，这方面是需要优化的

运行效果

[外链图片转存失败,源站可能有防盗链机制,建议将图片保存下来直接上传(img-D3CqEYwS-1689326000217)(https://p9-juejin.byteimg.com/tos-cn-i-k3u1fbpfcp/feb5937099224f3b93e1d4b7b8a25b50~tplv-k3u1fbpfcp-watermark.image?)]

完整代码

import random
import time

from playwright.sync_api import sync_playwright
import cv2
import requests


def get_move_x(image_path, template_path, image_height, image_width, template_height, template_width):
    # 背景图
    image = cv2.imread(image_path)
    image_resize = cv2.resize(image, (image_width, image_height))
    # 处理图像，保留大部分白色
    ret, thresholded_image = cv2.threshold(image_resize, 220, 255, cv2.THRESH_BINARY)
    # 灰度图像
    gray_image1 = cv2.cvtColor(thresholded_image, cv2.COLOR_BGR2GRAY)
    # 提高对比度
    denoised_image1 = cv2.equalizeHist(gray_image1)
    # 边缘检测
    image_canny = cv2.Canny(denoised_image1, threshold1=500, threshold2=900)

    # 滑动图
    template = cv2.imread(template_path)
    template_resize = cv2.resize(template, (template_width, template_height))
    template_gray = cv2.cvtColor(template_resize, cv2.COLOR_BGR2GRAY)
    denoised_image2 = cv2.equalizeHist(template_gray)
    template_canny = cv2.Canny(denoised_image2, threshold1=650, threshold2=900)

    # 进行模板匹配
    result = cv2.matchTemplate(image_canny, template_canny, cv2.TM_CCOEFF_NORMED)

    # 获取匹配结果的位置
    min_val, max_val, min_loc, max_loc = cv2.minMaxLoc(result)

    top_left2 = max_loc
    bottom_right2 = (top_left2[0] + template_resize.shape[1], top_left2[1] + template_resize.shape[0])
    # 在输入图像上绘制矩形标记
    cv2.rectangle(image_resize, top_left2, bottom_right2, (0, 0, 255), 2)
    cv2.imwrite('./test/Result'+str(int(time.time()))+'.jpg', image_resize)
    # x位置
    return max_loc[0]


with sync_playwright() as p:
    browser = p.chromium.launch(headless=False)
    context = browser.new_context()
    page = browser.new_page()
    page.goto("https://juejin.cn/")
    page.wait_for_timeout(1000)
    page.get_by_role("button", name="登录 注册").click()
    page.wait_for_timeout(1000)
    page.get_by_text("密码登录").click()
    page.wait_for_timeout(1000)
    page.get_by_placeholder("请输入邮箱/手机号（国际号码加区号）").click()
    page.wait_for_timeout(1000)
    page.get_by_placeholder("请输入邮箱/手机号（国际号码加区号）").fill("11111111111")
    page.wait_for_timeout(1000)
    page.get_by_placeholder("请输入密码").click()
    page.wait_for_timeout(1000)
    page.get_by_placeholder("请输入密码").fill("1933waH+")
    page.wait_for_timeout(1000)
    page.get_by_role("button", name="登录", exact=True).click()

    login_flag = False
    count = 2
    while not login_flag and count>0:
        # 背景图的设置
        imageEL = page.locator("#captcha-verify-image")
        # 保存图片
        resp = requests.get(imageEL.get_attribute("src"))
        with open('bg.jpeg', 'wb') as f:
            f.write(resp.content)
        # 滑动图
        templateEl = page.locator("#captcha_container img").nth(1)
        # 保存图片
        resp = requests.get(templateEl.get_attribute("src"))
        with open('template.png', 'wb') as f:
            f.write(resp.content)
        #  获取滑动距离
        image_height = imageEL.bounding_box()["height"]
        image_width = imageEL.bounding_box()["width"]
        template_height = templateEl.bounding_box()["height"]
        template_width = templateEl.bounding_box()["width"]
        # print(image_height, image_width, template_height, template_width)
        x = get_move_x("bg.jpeg", "template.png", image_height, image_width, 68, 68)
        # x 加偏移量
        x = x + 33
        print(x)
        box = page.locator("div").filter(has_text="按住左边按钮拖动完成上方拼图").nth(4).bounding_box()
        page.locator("#secsdk-captcha-drag-wrapper div").nth(1).hover()
        page.mouse.down()
        # 移动鼠标
        #  生成30次移动x轴的坐标
        start = 1
        end = x
        step = (end - start) / 29  # 计算递增步长
        for i in range(30):
            if i == 29:
                number = x
            else:
                number = start + i * step
            page.mouse.move(box["x"] + number, box["y"] + random.randint(-10, 10), steps=4)
        page.mouse.up()

        page.wait_for_timeout(2000)
        try:
            page.locator("a").filter(has_text="刷新").wait_for(timeout=1000)
            count = count - 1
        except Exception as e:
            print("登录成功")
            login_flag = True

    # 签到
    # page.get_by_role("button", name="去签到").click()
    # page.get_by_role("button", name="立即签到").click()
    # page.get_by_role("button", name="去抽奖").click()
    # page.locator("#turntable-item-0").click()
    # page.get_by_role("button", name="收下奖励").click()
    # 已签到
    # page.get_by_role("button", name="已签到").click()
    # page.get_by_role("button", name="今日已签到").click()
    # page.get_by_role("button", name="去抽奖").click()
    # page.locator("#turntable-item-0").click()
    # page.get_by_role("button", name="收下奖励").click()
    page.pause()
    # page.close()
    # browser.close()

其他

模拟拖动时，拖拽轨迹不能一条直线会被检测的，最好接近人的拖拽

多次模拟看起来识别率还可以

肆拾書時

关注

1
点赞
踩
6

收藏

觉得还不错? 一键收藏
2
评论
playwright+opencv 过滑块拼图验证码

最近看到浏览器自动化框架playwright，就使用了一下在模拟登录掘金是通过密码登陆时遇到需要通过拼图验证码于是通过查找发现可以通过opencv库解决问题下面是解决过程。
复制链接

扫一扫