#!/usr/bin/env python
# -*- coding:utf-8 -*-
import pytesseract
from captcha.image import ImageCaptcha
import random
# Captcha image generator (captcha.image.ImageCaptcha), constructed with no
# arguments; used further down to render the random code into an image.
imageCaptcha = ImageCaptcha()
# Candidate characters for the captcha text: A-Z, then a-z, then 0-9.
chars = [chr(c) for c in range(ord('A'), ord('Z') + 1)]
chars += [chr(c) for c in range(ord('a'), ord('z') + 1)]
chars += [str(d) for d in range(10)]
# Draw 4 characters with replacement (random.choices returns a list) and
# join them into the captcha string.
code = ''.join(random.choices(chars, k=4))
# Render the code as a captcha image and convert it to mode 'L'
# (single-channel grayscale) so each pixel is one integer.
image = imageCaptcha.generate_image(code)
image = image.convert('L')
# Pixel-access object; the assignments below modify `image` in place.
data = image.load()
w, h = image.size
# Binarize with a fixed threshold: pixels brighter than 180 become pure
# white (255), everything else pure black (0).
for x in range(w):
    for y in range(h):
        data[x, y] = 255 if data[x, y] > 180 else 0
# Display the binarized image for visual inspection.
image.show()
# Recognition often fails here because tesseract was trained on regular,
# squarely aligned glyphs. To improve accuracy, the captcha source could be
# modified so that the generated images look like ordinary text images.
# The result is bound to `text` rather than `str` so the builtin `str`
# is not shadowed.
text = pytesseract.image_to_string(image)
print(text)