【python 图像识别】python 身份证号码识别

最新推荐文章于 2025-03-12 13:59:27 发布

置顶东华果汁哥

最新推荐文章于 2025-03-12 13:59:27 发布

阅读量3.6w

点赞数 19

分类专栏：数据科学--python 文章标签： python 身份证识别

本文链接：https://blog.csdn.net/u013421629/article/details/72677964

版权

数据科学--python 专栏收录该内容

289 篇文章

订阅专栏

一、需求分析
识别身份证图片上的身份证号码。
如：
（此处为身份证示例图片）

二、Python 实现源代码（依赖 Pillow 与 pytesseract）

#!/usr/bin/python
# -*- coding: utf-8 -*-
import sys

# Python 2 only: make UTF-8 the implicit str/unicode conversion encoding so
# the UTF-8 byte-string messages below can be concatenated with OCR output.
# Neither reload() nor sys.setdefaultencoding() exists on Python 3, where
# str is already Unicode, so the hack is skipped there.
if sys.version_info[0] < 3:
    reload(sys)
    sys.setdefaultencoding('utf-8')

import time
# Start of the wall-clock measurement reported at the end of the script.
# It is taken before the imaging imports, so their import time is included.
time1 = time.time()
from PIL import Image
import pytesseract

# Binarization: threshold an image to pure black / pure white.
def binarizing(img, threshold):
    """Binarize *img* in place and return it.

    Every pixel whose value is below *threshold* is set to 0; every other
    pixel is set to 255. Pixel values are compared with *threshold*
    directly, so the image is expected to hold one number per pixel
    (the caller in this file passes a mode 'L' grayscale image).

    The image is modified through its pixel-access object, and the same
    image object that was passed in is returned.
    """
    pixels = img.load()
    width, height = img.size
    for row in range(height):
        for col in range(width):
            pixels[col, row] = 0 if pixels[col, row] < threshold else 255
    return img


# Noise removal: whiten pixels that are mostly surrounded by near-white ones.
def depoint(img):   # input: gray image
    """Remove isolated dark specks from *img* in place and return it.

    For every pixel that is not on the image border, the four direct
    neighbours (above, below, left, right) are inspected. If more than two
    of them are brighter than 245, the pixel itself is set to 255.

    The scan runs top-to-bottom, left-to-right on the live pixel data, so
    pixels already whitened above and to the left of the current position
    count as bright neighbours for later decisions. Border pixels are
    never changed.
    """
    pixels = img.load()
    width, height = img.size
    for row in range(1, height - 1):
        for col in range(1, width - 1):
            neighbours = (
                pixels[col, row - 1],
                pixels[col, row + 1],
                pixels[col - 1, row],
                pixels[col + 1, row],
            )
            bright = sum(1 for value in neighbours if value > 245)
            if bright > 2:
                pixels[col, row] = 255
    return img


# ID-card number recognition
def identity_OCR(pic_path, scale=3, region=(125, 200, 370, 250), threshold=100):
    """Run OCR on the ID-number strip of an ID-card image.

    The image is enlarged, the number strip is cropped out, converted to
    grayscale, binarized, de-noised and handed to pytesseract. The
    recognised text is printed and also returned.

    Args:
        pic_path: Path of the ID-card image file.
        scale: Integer enlargement factor applied to both dimensions
            before cropping (default 3).
        region: Crop box ``(left, upper, right, lower)`` of the number
            strip, in pixels of the ORIGINAL image; it is multiplied by
            *scale* to address the enlarged image. The default matches the
            sample card layout used by this script.
        threshold: Gray level below which a pixel is turned black during
            binarization (default 100).

    Returns:
        The text returned by ``pytesseract.image_to_string``.
    """
    source = Image.open(pic_path)
    width, height = source.size

    # Image.ANTIALIAS was removed in Pillow 10; LANCZOS is the same filter
    # under its current name. Fall back to ANTIALIAS only on very old
    # Pillow releases that lack LANCZOS.
    resample = getattr(Image, "LANCZOS", None)
    if resample is None:
        resample = Image.ANTIALIAS

    # Enlarge the card so the digits are big enough for the OCR engine.
    enlarged = source.resize((width * scale, height * scale), resample)

    # Cut out the number strip; the box is given in original-image pixels.
    crop_box = tuple(edge * scale for edge in region)
    gray = enlarged.crop(crop_box).convert('L')

    # Both helpers modify the image in place, so `gray` carries the result.
    binarizing(gray, threshold)
    depoint(gray)

    code = pytesseract.image_to_string(gray)
    # Single-argument print(...) behaves the same on Python 2 and Python 3.
    print("识别该身份证号码是:" + str(code))
    return code



if __name__ == '__main__':
    # The image path may be given as the first command-line argument;
    # without one, the original sample path is used.
    pic_path = sys.argv[1] if len(sys.argv) > 1 else "/root/image/331.jpg"
    identity_OCR(pic_path)
    time2 = time.time()
    # time1 is taken at module load, so the total includes import time.
    # Single-argument print(...) behaves the same on Python 2 and Python 3.
    print(u'总共耗时：' + str(time2 - time1) + 's')