-
下载
点我下载
提取码:sukc -
安装
一路下一步即可(记住安装路径) -
配置环境变量
新建系统变量,变量名:TESSDATA_PREFIX
变量值:C:\Program Files\Tesseract-OCR\tessdata(根据自己的安装路径更改)
再在Path变量中新增一项
值:C:\Program Files\Tesseract-OCR
重启PyCharm,使新的环境变量生效! -
代码
import pytesseract
from PIL import Image
from selenium import webdriver
# Log in to the demo site by OCR-ing its captcha image:
#   1. open the login page and take a full-page screenshot,
#   2. fill in the credentials,
#   3. crop the captcha out of the screenshot using the element's geometry,
#   4. run Tesseract on the crop and type the recognised text into the form.

# Browser to drive.
driver = webdriver.Firefox()
# Page under test.
driver.get("http://demo.tomexam.com/login.thtml")
driver.maximize_window()  # maximise the browser window
driver.implicitly_wait(10)
# Full-window screenshots; "code.png" is the one the captcha is cropped from.
driver.save_screenshot('screenshot.png')
driver.save_screenshot("code.png")

# find_element(by, value) with string strategies is used because the
# find_element_by_* helpers were removed in Selenium 4.3; this form works on
# both Selenium 3 and Selenium 4.
driver.find_element("name", "username").send_keys("admin1")
driver.find_element("name", "userpass").send_keys("admin1")

# Locate the captcha image element.
element = driver.find_element("xpath", '//*[@id="img_verifycode"]')
# Alternative: capture the element directly.
# element.screenshot("code.png")

# Top-left corner of the captcha. Each property access is a WebDriver
# round-trip, so it is read once and reused below.
locations = element.location
print(locations)
# Width and height of the captcha.
sizes = element.size
print(sizes)

# Bounding box of the captcha inside the screenshot.
# NOTE(review): assumes screenshot pixels map 1:1 to CSS pixels; on a scaled
# (HiDPI) display the box may need multiplying by the device pixel ratio.
x1 = locations['x']
y1 = locations['y']
x2 = x1 + sizes['width']
y2 = y1 + sizes['height']
print(x1, y1, x2, y2)

# Crop the captcha out of the screenshot, keep a copy on disk, and OCR it
# while the source image is still open so the file handle is closed afterwards.
with Image.open("code.png") as page_shot:
    captcha = page_shot.crop((x1, y1, x2, y2))
    captcha.save("code1.png")
    # Recognise the characters in the captcha.
    text = pytesseract.image_to_string(captcha, lang='eng')

# Tesseract output usually ends with a newline / form feed and may contain
# stray spaces; sending those to the input could type junk or submit the form
# early, so all whitespace is removed (captcha codes are assumed to contain
# no spaces).
text = "".join(text.split())
print(text)
driver.find_element(
    "xpath", "html/body/div[1]/div[1]/table/tbody/tr[3]/td/input"
).send_keys(text)