java-BufferedImage 图片验证码去除干扰线的方法( 用于OCR tesseract图像智能字符识别)

最近因工作需要,做了一个图片验证码自动识别的功能。网上关于初始图片的处理方法有去噪点、灰度化等,唯独很难搜到去除干扰线的方法。于是根据网上搜来的代码,自己尝试写了一段,亲测有效,可以比较干净地去除干扰线,提高OCR识别的准确率。

  • 以下代码除“去除干扰线条”一小段为原创外,其他均为网上搜寻所得,但是很抱歉我忘记了来源网址,以后如果能找到再补上。在此先谢过慷慨分享原始代码的前辈!

demo如下:

import java.awt.Color;
import java.awt.image.BufferedImage;
import java.io.File;
import java.io.IOException;


import javax.imageio.ImageIO;


/**
 * Pre-processes captcha images for OCR: brightens and gray-scales the image,
 * binarizes it with an Otsu threshold, and then erases thin interference
 * lines from the binary result.
 */
public class CopyOfCleanLines {

    /** Largest R+G+B sum (range 0..765) that is still classified as black. */
    private static final int BLACK_BRIGHTNESS_LIMIT = 300;

    /** Opaque white as a packed ARGB value. */
    private static final int WHITE_ARGB = 0xFFFFFFFF;

    /** Opaque black as a packed ARGB value. */
    private static final int BLACK_ARGB = 0xFF000000;

    /** Number of distinct 8-bit gray levels, i.e. the histogram size. */
    private static final int GRAY_LEVELS = 256;

    /**
     * Cleans every regular file found in the {@code imgWithLines} directory and
     * writes the results to its {@code tmp} sub-directory.
     *
     * @param args unused
     * @throws IOException if the input directory cannot be listed or an image
     *                     cannot be read or written
     */
    public static void main(String[] args) throws IOException {
        File testDataDir = new File("imgWithLines");
        final String destDir = testDataDir.getAbsolutePath() + "/tmp";

        // listFiles() returns null when the path is not a directory or cannot be read.
        File[] candidates = testDataDir.listFiles();
        if (candidates == null) {
            throw new IOException("Cannot list input directory: " + testDataDir.getAbsolutePath());
        }
        for (File file : candidates) {
            // The output directory lives inside the input directory; skip it
            // (and any other non-file entry) so a second run does not fail.
            if (!file.isFile()) {
                continue;
            }
            // One call is enough: every call re-reads the untouched source file,
            // so repeating it only rewrites the same output.
            cleanLinesInImage(file, destDir);
        }
    }

    /**
     * Binarizes an image, removes interference lines from it, prints the result
     * as an ASCII matrix on standard output and stores it in {@code destDir}
     * under the source file's name. The output is always JPEG-encoded,
     * whatever extension the source file name carries.
     *
     * @param sfile   the image to clean
     * @param destDir directory that receives the cleaned image; created if missing
     * @throws IOException if the directory cannot be created, the file is not a
     *                     decodable image, or the result cannot be written
     */
    public static void cleanLinesInImage(File sfile, String destDir) throws IOException {
        File destF = new File(destDir);
        if (!destF.isDirectory() && !destF.mkdirs() && !destF.isDirectory()) {
            throw new IOException("Cannot create output directory: " + destF.getAbsolutePath());
        }

        // ImageIO.read returns null (rather than throwing) when no reader understands the file.
        BufferedImage bufferedImage = ImageIO.read(sfile);
        if (bufferedImage == null) {
            throw new IOException("Not a readable image: " + sfile.getAbsolutePath());
        }
        int h = bufferedImage.getHeight();
        int w = bufferedImage.getWidth();

        int[][] gray = toBrightenedGray(bufferedImage, w, h);
        int threshold = ostu(gray, w, h);
        BufferedImage binaryBufferedImage = binarize(gray, w, h, threshold);

        removeInterferenceLines(binaryBufferedImage, w, h);
        printMatrix(binaryBufferedImage, w, h);

        File target = new File(destDir, sfile.getName());
        // ImageIO.write returns false when no suitable writer is available.
        if (!ImageIO.write(binaryBufferedImage, "jpg", target)) {
            throw new IOException("No image writer could encode: " + target.getAbsolutePath());
        }
    }

    /** Brightens every pixel and converts it to a gamma-weighted gray level, indexed as [x][y]. */
    private static int[][] toBrightenedGray(BufferedImage image, int w, int h) {
        int[][] gray = new int[w][h];
        for (int x = 0; x < w; x++) {
            for (int y = 0; y < h; y++) {
                int argb = image.getRGB(x, y);
                int r = brighten((argb >> 16) & 0xFF);
                int g = brighten((argb >> 8) & 0xFF);
                int b = brighten(argb & 0xFF);
                // Gamma-aware luminance: mix the channels in the 2.2-power domain,
                // then map the result back with the inverse exponent.
                gray[x][y] = (int) Math.pow(
                        Math.pow(r, 2.2) * 0.2973 + Math.pow(g, 2.2) * 0.6274 + Math.pow(b, 2.2) * 0.0753,
                        1 / 2.2);
            }
        }
        return gray;
    }

    /** Scales a channel by 1.1, adds 30 and clamps the result to 255. */
    private static int brighten(int channel) {
        return Math.min(255, (int) (channel * 1.1 + 30));
    }

    /** Builds a black/white image: gray levels above the threshold become white, the rest black. */
    private static BufferedImage binarize(int[][] gray, int w, int h, int threshold) {
        BufferedImage binary = new BufferedImage(w, h, BufferedImage.TYPE_BYTE_BINARY);
        for (int x = 0; x < w; x++) {
            for (int y = 0; y < h; y++) {
                binary.setRGB(x, y, gray[x][y] > threshold ? WHITE_ARGB : BLACK_ARGB);
            }
        }
        return binary;
    }

    /**
     * Erases black pixels that have white on both sides along any of the four
     * axes (horizontal, vertical, both diagonals). Border pixels are never
     * touched. The image is modified in place while scanning row by row, so
     * later checks already see pixels cleared earlier in the scan.
     */
    private static void removeInterferenceLines(BufferedImage image, int w, int h) {
        for (int y = 1; y < h - 1; y++) {
            for (int x = 1; x < w - 1; x++) {
                if (!isBlack(image.getRGB(x, y))) {
                    continue;
                }
                boolean isolated =
                        // white on the left and on the right
                        (isWhite(image.getRGB(x - 1, y)) && isWhite(image.getRGB(x + 1, y)))
                        // white above and below
                        || (isWhite(image.getRGB(x, y + 1)) && isWhite(image.getRGB(x, y - 1)))
                        // white on both ends of either diagonal
                        || (isWhite(image.getRGB(x - 1, y + 1)) && isWhite(image.getRGB(x + 1, y - 1)))
                        || (isWhite(image.getRGB(x + 1, y + 1)) && isWhite(image.getRGB(x - 1, y - 1)));
                if (isolated) {
                    image.setRGB(x, y, WHITE_ARGB);
                }
            }
        }
    }

    /** Prints the image on standard output, one text row per pixel row: '*' for black, ' ' otherwise. */
    private static void printMatrix(BufferedImage image, int w, int h) {
        for (int y = 0; y < h; y++) {
            StringBuilder row = new StringBuilder(w);
            for (int x = 0; x < w; x++) {
                row.append(isBlack(image.getRGB(x, y)) ? '*' : ' ');
            }
            System.out.println(row);
        }
    }

    /**
     * Tells whether a packed RGB value counts as black.
     *
     * @param colorInt packed (A)RGB value; the alpha byte is ignored
     * @return {@code true} when R+G+B is at most 300
     */
    public static boolean isBlack(int colorInt) {
        return getColorBright(colorInt) <= BLACK_BRIGHTNESS_LIMIT;
    }

    /**
     * Tells whether a packed RGB value counts as white; the exact complement
     * of {@link #isBlack(int)}.
     *
     * @param colorInt packed (A)RGB value; the alpha byte is ignored
     * @return {@code true} when R+G+B is greater than 300
     */
    public static boolean isWhite(int colorInt) {
        return getColorBright(colorInt) > BLACK_BRIGHTNESS_LIMIT;
    }

    /**
     * Tells whether a colour is close to pure black or pure white.
     *
     * @param colorInt packed (A)RGB value; the alpha byte is ignored
     * @return 1 when R+G+B is below 30 or above 730, otherwise 0
     */
    public static int isBlackOrWhite(int colorInt) {
        int bright = getColorBright(colorInt);
        return (bright < 30 || bright > 730) ? 1 : 0;
    }

    /**
     * Sums the red, green and blue components of a packed colour.
     *
     * @param colorInt packed (A)RGB value; the alpha byte is ignored
     * @return R+G+B, in the range 0..765
     */
    public static int getColorBright(int colorInt) {
        return ((colorInt >> 16) & 0xFF) + ((colorInt >> 8) & 0xFF) + (colorInt & 0xFF);
    }

    /**
     * Computes a binarization threshold with Otsu's method, i.e. the gray
     * level that maximizes the between-class variance of the two pixel groups
     * it separates.
     *
     * @param gray gray levels indexed as {@code gray[x][y]}; only the low
     *             8 bits of each entry are used
     * @param w    image width (first dimension of {@code gray})
     * @param h    image height (second dimension of {@code gray})
     * @return the chosen threshold in 0..255; 0 when all pixels share one level
     */
    public static int ostu(int[][] gray, int w, int h) {
        // One bucket per gray level. Sizing this by the pixel count (w * h)
        // overflows the array for any image smaller than 256 pixels.
        int[] histData = new int[GRAY_LEVELS];
        for (int x = 0; x < w; x++) {
            for (int y = 0; y < h; y++) {
                histData[0xFF & gray[x][y]]++;
            }
        }

        int total = w * h;

        // long/double accumulators keep the sums exact for large images.
        long sum = 0;
        for (int t = 0; t < GRAY_LEVELS; t++) {
            sum += (long) t * histData[t];
        }

        long sumB = 0;
        int wB = 0;
        double varMax = 0;
        int threshold = 0;

        for (int t = 0; t < GRAY_LEVELS; t++) {
            wB += histData[t]; // background weight: pixels at or below t
            if (wB == 0) {
                continue;
            }

            int wF = total - wB; // foreground weight: pixels above t
            if (wF == 0) {
                break; // every pixel is already in the background class
            }

            sumB += (long) t * histData[t];

            double mB = (double) sumB / wB;         // background mean
            double mF = (double) (sum - sumB) / wF; // foreground mean

            double varBetween = (double) wB * (double) wF * (mB - mF) * (mB - mF);

            // Strict comparison keeps the lowest level among equal maxima.
            if (varBetween > varMax) {
                varMax = varBetween;
                threshold = t;
            }
        }

        return threshold;
    }
}
  • 5
    点赞
  • 19
    收藏
    觉得还不错? 一键收藏
  • 1
    评论
以下是一个简单的Java代码示例,演示了如何使用Tesseract OCR库和iText库实现OCR识别图片并转换成双层PDF:

```java
import java.io.File;
import java.io.FileOutputStream;
import java.io.IOException;
import javax.imageio.ImageIO;
import com.itextpdf.awt.DefaultFontMapper;
import com.itextpdf.text.Document;
import com.itextpdf.text.PageSize;
import com.itextpdf.text.Rectangle;
import com.itextpdf.text.pdf.PdfContentByte;
import com.itextpdf.text.pdf.PdfLayer;
import com.itextpdf.text.pdf.PdfLayerMembership;
import com.itextpdf.text.pdf.PdfName;
import com.itextpdf.text.pdf.PdfWriter;
import net.sourceforge.tess4j.Tesseract;
import net.sourceforge.tess4j.TesseractException;
import net.sourceforge.tess4j.util.ImageHelper;

public class OCRToPDF {
    public static void main(String[] args) {
        // 读取图片文件
        File imageFile = new File("input.png");
        // 定义输出PDF文件
        File pdfFile = new File("output.pdf");
        // 创建Tesseract OCR对象
        Tesseract tesseract = new Tesseract();
        // 设置OCR语言为英语
        tesseract.setLanguage("eng");
        try {
            // 读取图片并转换为灰度图像
            BufferedImage image = ImageIO.read(imageFile);
            BufferedImage grayImage = ImageHelper.convertImageToGrayscale(image);
            // 进行OCR识别
            String result = tesseract.doOCR(grayImage);
            // 创建PDF文档
            Document document = new Document(PageSize.A4);
            // 创建PDF写入器
            PdfWriter writer = PdfWriter.getInstance(document, new FileOutputStream(pdfFile));
            // 打开文档
            document.open();
            // 创建图层
            PdfContentByte canvas = writer.getDirectContent();
            PdfLayer imageLayer = new PdfLayer("Image Layer", writer);
            PdfLayer textLayer = new PdfLayer("Text Layer", writer);
            // 将图像添加到图像层
            PdfLayerMembership imageMembership = new PdfLayerMembership(writer);
            imageMembership.addMember(imageLayer);
            canvas.beginLayer(imageMembership);
            canvas.drawImage(Image.getInstance(imageFile.getAbsolutePath()), 0, 0, PageSize.A4.getWidth(), PageSize.A4.getHeight());
            canvas.endLayer();
            // 将OCR识别文本添加到文本层
            PdfLayerMembership textMembership = new PdfLayerMembership(writer);
            textMembership.addMember(textLayer);
            canvas.beginLayer(textMembership);
            canvas.beginText();
            canvas.setFontAndSize(DefaultFontMapper.getAModelFont("Arial", false), 12);
            canvas.showTextAligned(result, 100, 100, PdfContentByte.ALIGN_LEFT);
            canvas.endText();
            canvas.endLayer();
            // 关闭文档
            document.close();
        } catch (IOException e) {
            e.printStackTrace();
        } catch (TesseractException e) {
            e.printStackTrace();
        } catch (Exception e) {
            e.printStackTrace();
        }
    }
}
```

请注意,此示例代码仅提供了基本的实现方法。在实际应用中,您需要根据具体需求进行更细粒度的调整和优化。

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论 1
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值