Java Tess4J OCR文字识别实现

博主： admin
发布时间：2022 年 04 月 10 日
692 次浏览
7972字数
分类： Java

Tess4J简介

Tesseract-OCR支持中文识别，开源并提供全套训练工具，是快速、低成本开发的首选。Tess4J则是Tesseract的Java封装（基于JNA），可在PC端的Java程序中直接调用。它对英文和数字的识别效果不错，但对中文的识别速度和识别率都较弱；有条件的话，建议针对具体场景训练语言模型，以获得更好的结果。
项目地址：https://github.com/tesseract-ocr
语言包下载地址：https://github.com/tesseract-ocr/tessdata

Demo

下面附上我自己的测试过程：
（1）新建一个SpringBoot工程，我用的版本是2.5.10。
（2）后端相关类和配置：

1、引入pom.xml配置：

Maven依赖

        <!-- ocr -->
        <dependency>
            <groupId>net.sourceforge.tess4j</groupId>
            <artifactId>tess4j</artifactId>
            <version>5.0.0</version>
        </dependency>
        <dependency>
            <groupId>net.java.dev.jna</groupId>
            <artifactId>jna-platform</artifactId>
            <version>5.11.0</version>
        </dependency>

2、相关Utils工具类：

ImgFileUtils

package com.ocr.utils;

import javax.imageio.ImageIO;
import java.awt.image.BufferedImage;
import java.io.File;
import java.io.IOException;
import java.io.OutputStream;

public class ImgFileUtils {

    /**
     * Saves the image to a file in PNG format.
     *
     * <p>Alias of {@link #saveAsPNG(BufferedImage, File)}, kept for existing callers.
     *
     * @param subimage image to save
     * @param file     destination file
     * @throws IOException if writing fails or no PNG writer accepts the image
     */
    public static void saveToFile(BufferedImage subimage, File file) throws IOException {
        saveAsPNG(subimage, file);
    }

    /**
     * Saves the image to a file in PNG format.
     *
     * @param subimage image to save
     * @param file     destination file
     * @throws IOException if writing fails or no PNG writer accepts the image
     */
    public static void saveAsPNG(BufferedImage subimage, File file) throws IOException {
        // ImageIO.write reports "no appropriate writer found" by returning false,
        // not by throwing; surface it so the caller does not assume the file exists.
        if (!ImageIO.write(subimage, "png", file)) {
            throw new IOException("No image writer could encode the image as png: " + file);
        }
    }

    /**
     * Saves the image to a file in JPEG format.
     *
     * @param subimage image to save
     * @param file     destination file
     * @throws IOException if writing fails or no JPEG writer accepts the image
     *                     (this can happen for image types the JPEG writer rejects,
     *                     for example images with an alpha channel on recent JDKs)
     */
    public static void saveAsJPEG(BufferedImage subimage, File file) throws IOException {
        if (!ImageIO.write(subimage, "JPEG", file)) {
            throw new IOException("No image writer could encode the image as JPEG: " + file);
        }
    }

    /**
     * Writes the image to an output stream in PNG format. The stream is not closed.
     *
     * @param subimage image to write
     * @param out      destination stream
     * @throws IOException if writing fails or no PNG writer accepts the image
     */
    public static void write(BufferedImage subimage, OutputStream out) throws IOException {
        if (!ImageIO.write(subimage, "png", out)) {
            throw new IOException("No image writer could encode the image as png");
        }
    }

}

ImgUtils

package com.ocr.utils;

import java.awt.image.BufferedImage;

public class ImgUtils {

    /** Pixels removed from the left edge by {@link #clipImage(BufferedImage)}. */
    private static final int CLIP_LEFT = 8;
    /** Pixels removed from the top edge by {@link #clipImage(BufferedImage)}. */
    private static final int CLIP_TOP = 5;
    /** Total width removed by {@link #clipImage(BufferedImage)} (left and right combined). */
    private static final int CLIP_WIDTH_REDUCTION = 20;
    /** Total height removed by {@link #clipImage(BufferedImage)} (top and bottom combined). */
    private static final int CLIP_HEIGHT_REDUCTION = 10;

    /**
     * Crops a fixed margin off the image to remove the dark border around a captured window.
     *
     * <p>The result starts at (8, 5) and is 20 pixels narrower and 10 pixels shorter than
     * the source. It is created with {@link BufferedImage#getSubimage}, so it shares pixel
     * data with {@code srcImage}.
     *
     * @param srcImage image to crop; must be larger than 20x10 pixels
     * @return the cropped view of {@code srcImage}
     * @throws java.awt.image.RasterFormatException if the image is too small to crop
     */
    public static BufferedImage clipImage(BufferedImage srcImage) {
        int width = srcImage.getWidth() - CLIP_WIDTH_REDUCTION;
        int height = srcImage.getHeight() - CLIP_HEIGHT_REDUCTION;
        if (width <= 0 || height <= 0) {
            // Same exception type getSubimage would raise, but with an actionable message.
            throw new java.awt.image.RasterFormatException(
                    "Image " + srcImage.getWidth() + "x" + srcImage.getHeight()
                            + " is too small to clip; it must be larger than "
                            + CLIP_WIDTH_REDUCTION + "x" + CLIP_HEIGHT_REDUCTION);
        }
        return srcImage.getSubimage(CLIP_LEFT, CLIP_TOP, width, height);
    }

    /**
     * Converts the image to grayscale.
     *
     * @param srcImage image to convert
     * @return a new {@link BufferedImage#TYPE_BYTE_GRAY} image of the same size
     */
    public static BufferedImage grayImage(BufferedImage srcImage) {
        return copyImage(srcImage, new BufferedImage(srcImage.getWidth(), srcImage.getHeight(), BufferedImage.TYPE_BYTE_GRAY));
    }

    /**
     * Converts the image to black and white.
     *
     * @param srcImage image to convert
     * @return a new {@link BufferedImage#TYPE_BYTE_BINARY} image of the same size
     */
    public static BufferedImage binaryImage(BufferedImage srcImage) {
        return copyImage(srcImage, new BufferedImage(srcImage.getWidth(), srcImage.getHeight(), BufferedImage.TYPE_BYTE_BINARY));
    }

    /**
     * Copies every pixel of {@code srcImage} into {@code destImage} at the same coordinates.
     * Colour conversion is whatever {@code destImage.setRGB} applies for its image type.
     *
     * @param srcImage  image to read from
     * @param destImage image to write into; must be at least as large as {@code srcImage}
     * @return {@code destImage}
     * @throws IllegalArgumentException if {@code destImage} is smaller than {@code srcImage}
     */
    public static BufferedImage copyImage(BufferedImage srcImage, BufferedImage destImage) {
        int width = srcImage.getWidth();
        int height = srcImage.getHeight();
        if (destImage.getWidth() < width || destImage.getHeight() < height) {
            // Fail before touching destImage instead of half-way through the copy.
            throw new IllegalArgumentException(
                    "Destination " + destImage.getWidth() + "x" + destImage.getHeight()
                            + " is smaller than source " + width + "x" + height);
        }

        // Transfer one row at a time: same per-pixel conversion as getRGB/setRGB on single
        // pixels, with far fewer calls and only one row of temporary storage.
        int[] row = new int[width];
        for (int y = 0; y < height; y++) {
            srcImage.getRGB(0, y, width, 1, row, 0, width);
            destImage.setRGB(0, y, width, 1, row, 0, width);
        }

        return destImage;
    }

}

OCRUtils

package com.ocr.utils;

import net.sourceforge.tess4j.ITesseract;
import net.sourceforge.tess4j.Tesseract;

import java.awt.image.BufferedImage;
import java.io.File;

public class OCRUtils {

    /** Language used by the single-argument overloads; read at call time, so it may be reassigned. */
    public static String DEFAULT_LANG="eng";
    /** Directory handed to the engine as its data path; read at call time, so it may be reassigned. */
    public static String DATA_PATH="D:/temp/test_data/";

    /**
     * Recognizes the text in an image file.
     *
     * @param imageFile image file to recognize; must not be null
     * @param lang      language passed to the engine (e.g. {@code "eng"}, {@code "chi_sim"})
     * @return the recognized text
     * @throws IllegalArgumentException if {@code imageFile} is null
     * @throws Exception if the engine fails to process the image
     */
    public static String doOCRFromFile(File imageFile,String lang) throws Exception {
        if (imageFile == null) {
            throw new IllegalArgumentException("imageFile must not be null");
        }
        return newEngine(lang).doOCR(imageFile);
    }

    /**
     * Recognizes the text in an image file using {@link #DEFAULT_LANG}.
     *
     * @param imageFile image file to recognize; must not be null
     * @return the recognized text
     * @throws Exception if the engine fails to process the image
     */
    public static String doOCRFromFile(File imageFile) throws Exception {
        return doOCRFromFile(imageFile,DEFAULT_LANG);
    }

    /**
     * Recognizes the text in an in-memory image.
     *
     * @param bufferedImage image to recognize; must not be null
     * @param lang          language passed to the engine (e.g. {@code "eng"}, {@code "chi_sim"})
     * @return the recognized text
     * @throws IllegalArgumentException if {@code bufferedImage} is null
     * @throws Exception if the engine fails to process the image
     */
    public static String doOCRFromImgBuffer(BufferedImage bufferedImage,String lang) throws Exception {
        if (bufferedImage == null) {
            throw new IllegalArgumentException("bufferedImage must not be null");
        }
        return newEngine(lang).doOCR(bufferedImage);
    }

    /**
     * Recognizes the text in an in-memory image using {@link #DEFAULT_LANG}.
     *
     * @param bufferedImage image to recognize; must not be null
     * @return the recognized text
     * @throws Exception if the engine fails to process the image
     */
    public static String doOCRFromImgBuffer(BufferedImage bufferedImage) throws Exception {
        return doOCRFromImgBuffer(bufferedImage,DEFAULT_LANG);
    }

    /**
     * Builds a freshly configured engine for one recognition call.
     * A new instance per call means the current {@link #DATA_PATH} is always used.
     */
    private static ITesseract newEngine(String lang) {
        ITesseract instance = new Tesseract();
        instance.setDatapath(DATA_PATH); // directory containing the language data
        // Presumably supplies a resolution for images that carry no DPI metadata
        // (such as screenshots) -- confirm against the Tesseract parameter docs.
        instance.setTessVariable("user_defined_dpi", "300");
        instance.setLanguage(lang);
        return instance;
    }

}

WindowsUtils

package com.ocr.utils;

import com.sun.jna.platform.win32.User32;
import com.sun.jna.platform.win32.WinDef.HWND;
import com.sun.jna.platform.win32.WinDef.RECT;

import java.awt.*;
import java.awt.image.BufferedImage;
import java.io.IOException;

public class WindowsUtils {

    /**
     * Pause, in milliseconds, between activating a window and capturing it, so the window
     * has a chance to repaint. The value is a heuristic, not a guarantee.
     */
    private static final int ACTIVATE_SETTLE_MILLIS = 200;

    /**
     * Captures a rectangular screen region.
     *
     * @param x1 x coordinate of the top-left corner
     * @param y1 y coordinate of the top-left corner
     * @param x2 x coordinate of the bottom-right corner (exclusive); must be greater than {@code x1}
     * @param y2 y coordinate of the bottom-right corner (exclusive); must be greater than {@code y1}
     * @return the captured region, {@code x2 - x1} wide and {@code y2 - y1} high
     * @throws IllegalArgumentException if the two corners do not describe a non-empty rectangle
     * @throws Exception if the screen cannot be captured (e.g. {@link AWTException})
     */
    public static BufferedImage captureImg(int x1, int y1, int x2, int y2) throws Exception {
        if (x2 <= x1 || y2 <= y1) {
            throw new IllegalArgumentException(
                    "Bottom-right corner (" + x2 + "," + y2 + ") must lie below and to the right of"
                            + " top-left corner (" + x1 + "," + y1 + ")");
        }
        // (x2, y2) is a corner, not a size: convert to width/height before capturing.
        Rectangle region = new Rectangle(x1, y1, x2 - x1, y2 - y1);
        return new Robot().createScreenCapture(region);
    }

    /**
     * Restores and activates a window, then captures the screen area it occupies (via AWT).
     *
     * @param hWnd handle of the window to capture
     * @return screenshot of the window's bounding rectangle
     * @throws AWTException if the platform does not allow low-level screen capture
     * @throws IOException  if the window rectangle cannot be obtained
     */
    public static BufferedImage captureWindowAndActive(HWND hWnd) throws AWTException, IOException {
        // Restore and activate BEFORE reading the bounds: the rectangle of a minimized
        // window does not describe where it will appear once restored.
        User32.INSTANCE.ShowWindow(hWnd, User32.SW_SHOWNORMAL); // restore if minimized
        User32.INSTANCE.SetForegroundWindow(hWnd); // bring to front

        Robot robot = new Robot();
        robot.delay(ACTIVATE_SETTLE_MILLIS);

        RECT r = new RECT();
        if (!User32.INSTANCE.GetWindowRect(hWnd, r)) {
            throw new IOException("GetWindowRect failed for window " + hWnd);
        }
        return robot.createScreenCapture(r.toRectangle());
    }

}

3、测试Demo

Demo

package com.ocr;

import com.ocr.utils.ImgFileUtils;
import com.ocr.utils.ImgUtils;
import com.ocr.utils.OCRUtils;
import com.ocr.utils.WindowsUtils;
import com.sun.jna.platform.win32.User32;
import com.sun.jna.platform.win32.WinDef;

import java.io.File;

public class DemoOCR {
    /** Title of the window to capture: the test text file opened in Notepad. */
    private static final String WIN_TITLE="测试OCR.txt - 记事本";
    /** Directory holding the saved capture and the sample image to recognize. */
    private static final String PICTURE_PATH = System.getProperty("user.dir")+"/picture";

    /**
     * OCR test: captures the window titled {@link #WIN_TITLE}, saves the cropped
     * screenshot as {@code capture.png} and prints the text recognized from it.
     *
     * @throws Exception if the output directory cannot be created, or capture/OCR fails
     */
    public static void testCapture() throws Exception {
        // Where the screenshot is saved.
        File imgFile = new File(PICTURE_PATH + "/capture.png");
        File dir = imgFile.getParentFile();
        if (!dir.isDirectory() && !dir.mkdirs()) {
            throw new java.io.IOException("Cannot create directory: " + dir);
        }

        // FindWindow: first argument is the window class, second is the window title.
        WinDef.HWND hWnd = User32.INSTANCE.FindWindow(null, WIN_TITLE);
        System.out.println("找到窗体："+hWnd);

        if (hWnd == null) {
            System.out.println("未找到窗口");
            return;
        }

        // Capture once so the saved file and the OCR input come from the same screenshot.
        // The window is activated first because some windows capture incorrectly otherwise.
        java.awt.image.BufferedImage clipped =
                ImgUtils.clipImage(WindowsUtils.captureWindowAndActive(hWnd));
        ImgFileUtils.saveAsPNG(clipped, imgFile);

        // Recognize a grayscale copy of the cropped screenshot.
        String ocrRs = OCRUtils.doOCRFromImgBuffer(ImgUtils.grayImage(clipped));
        System.out.println("识别窗体文本信息："+ocrRs);
    }

    /**
     * Entry point: points OCR at the project's {@code config} directory, runs the
     * window-capture test, then recognizes {@code picture/capture1.png}.
     */
    public static void main(String[] args) {
        System.out.println("OCR文字识别已启动！");
        try {
            // Location of the language data.
            OCRUtils.DATA_PATH=System.getProperty("user.dir")+"/config";
            OCRUtils.DEFAULT_LANG="chi_sim"; // eng: English, chi_sim: Simplified Chinese

            // OCR test 1: capture a window and recognize it.
            testCapture();

            // OCR test 2: recognize an existing image file.
            File sample = new File(PICTURE_PATH+"/capture1.png");
            if (!sample.isFile()) {
                System.out.println("未找到待识别图片：" + sample.getAbsolutePath());
                return;
            }
            String ocrText = OCRUtils.doOCRFromFile(sample);
            System.out.println("识别文本信息："+ocrText);

        } catch (Exception e) {
            // Demo boundary: report the failure and let the program end.
            e.printStackTrace();
        }
    }
}

运行前，请在项目根目录新建两个文件夹：
1.picture：存放待识别的图片（Demo会读取其中的capture1.png，窗口截图也会保存为该目录下的capture.png）；
2.config：存放下载的语言包（例如简体中文对应chi_sim.traineddata）。

最后修改：2022 年 04 月 11 日

给我一点小钱钱也很高兴啦！o(*￣▽￣*)ブ

Java Tess4J OCR文字识别实现

admin • 2022 年 04 月 10 日

<h4>Tess4J简介</h4><p>Tesseract-OCR支持中文识别，并且开源和提供全套的训练工具，是快速低成本开发的首选。而Tess4J则是Tesseract在Java PC上的应用。在英文和数字识别中性能还是不错的，但是在中文识别中，无论速度还是识别率还是较弱，建议有条件的话，针对场景进行训练，会获得较好结果。<br>项目地址：<span class="external-link"><a class="no-external-link" href="https://github.com/tesseract-ocr" target="_blank"><i data-feather="external-link"></i>https://github.com/tesseract-ocr</a></span><br>语言包下载地址：<span class="external-link"><a class="no-external-link" href="https://github.com/tesseract-ocr/tessdata" target="_blank"><i data-feather="external-link"></i>https://github.com/tesseract-ocr/tessdata</a></span></p><h4>Demo</h4><p>下面附上我自己的测试过程：<br>（1）新建一个SpringBoot工程，我用的版本是2.5.10。<br>（2）后端相关类和配置：</p><h5>1、引入pom.xml配置：</h5><p><div class="panel panel-default collapse-panel box-shadow-wrap-lg"><div class="panel-heading panel-collapse" data-toggle="collapse" data-target="#collapse-70d4b3e1c5670ba7d9bf54d38ec859ea100" aria-expanded="true"><div class="accordion-toggle"><span style="">Maven依赖</span>
<i class="pull-right fontello icon-fw fontello-angle-right"></i>
</div>
</div>
<div class="panel-body collapse-panel-body">
<div id="collapse-70d4b3e1c5670ba7d9bf54d38ec859ea100" class="collapse collapse-content"><p></p></p><pre><code class="lang-Java">        &lt;!-- ocr --&gt;
        &lt;dependency&gt;
            &lt;groupId&gt;net.sourceforge.tess4j&lt;/groupId&gt;
            &lt;artifactId&gt;tess4j&lt;/artifactId&gt;
            &lt;version&gt;5.0.0&lt;/version&gt;
        &lt;/dependency&gt;
        &lt;dependency&gt;
            &lt;groupId&gt;net.java.dev.jna&lt;/groupId&gt;
            &lt;artifactId&gt;jna-platform&lt;/artifactId&gt;
            &lt;version&gt;5.11.0&lt;/version&gt;
        &lt;/dependency&gt;</code></pre><p><p></p></div></div></div></p><h5>2、相关Utils工具类：</h5><p><div class="panel panel-default collapse-panel box-shadow-wrap-lg"><div class="panel-heading panel-collapse" data-toggle="collapse" data-target="#collapse-5b4b84b420c41ec4b9fdf5ffacf231b260" aria-expanded="true"><div class="accordion-toggle"><span style="">ImgFileUtils</span>
<i class="pull-right fontello icon-fw fontello-angle-right"></i>
</div>
</div>
<div class="panel-body collapse-panel-body">
<div id="collapse-5b4b84b420c41ec4b9fdf5ffacf231b260" class="collapse collapse-content"><p></p></p><pre><code class="lang-Java">package com.ocr.utils;

import javax.imageio.ImageIO;
import java.awt.image.BufferedImage;
import java.io.File;
import java.io.IOException;
import java.io.OutputStream;

public class ImgFileUtils {
    
    /**
     * 存为PNG格式
     */
    public static void saveToFile(BufferedImage subimage, File file) throws IOException {
        ImageIO.write(subimage, &quot;png&quot;, file);
    }
    
    /** 
     * 存为PNG格式 
     */
    public static void saveAsPNG(BufferedImage subimage, File file) throws IOException {
        ImageIO.write(subimage, &quot;png&quot;, file);
    }
    
    /** 
     * 存为JPEG格式图像文件 
     */
    public static void saveAsJPEG(BufferedImage subimage, File file) throws IOException {
        ImageIO.write(subimage, &quot;JPEG&quot;, file);
    }
    
    /** 
     * 写入一个OutputStream 
     */
    public static void write(BufferedImage subimage, OutputStream out) throws IOException {
        ImageIO.write(subimage, &quot;png&quot;, out);
    }
    
}</code></pre><p><p></p></div></div></div><br><div class="panel panel-default collapse-panel box-shadow-wrap-lg"><div class="panel-heading panel-collapse" data-toggle="collapse" data-target="#collapse-88a3343d45ac5f1f7d25ec130b7c757585" aria-expanded="true"><div class="accordion-toggle"><span style="">ImgUtils</span>
<i class="pull-right fontello icon-fw fontello-angle-right"></i>
</div>
</div>
<div class="panel-body collapse-panel-body">
<div id="collapse-88a3343d45ac5f1f7d25ec130b7c757585" class="collapse collapse-content"><p></p></p><pre><code class="lang-Java">package com.ocr.utils;

import java.awt.image.BufferedImage;

public class ImgUtils {
    
    /**
     * 裁剪图片：去掉黑边
     */
    public static BufferedImage clipImage(BufferedImage srcImage) {
        return srcImage.getSubimage(8, 5, srcImage.getWidth() - 20, srcImage.getHeight() - 10);
    }
    
    /**
     * 灰度化
     */
    public static BufferedImage grayImage(BufferedImage srcImage) {
        return copyImage(srcImage, new BufferedImage(srcImage.getWidth(), srcImage.getHeight(), BufferedImage.TYPE_BYTE_GRAY));
    }
    
    /**
     * 二值化
     */
    public static BufferedImage binaryImage(BufferedImage srcImage) {
        return copyImage(srcImage, new BufferedImage(srcImage.getWidth(), srcImage.getHeight(), BufferedImage.TYPE_BYTE_BINARY));
    }
    
    public static BufferedImage copyImage(BufferedImage srcImage, BufferedImage destImage) {
        for (int y = 0; y &lt; srcImage.getHeight(); y++) {
            for (int x = 0; x &lt; srcImage.getWidth(); x++) {
                destImage.setRGB(x, y, srcImage.getRGB(x, y));
            }
        }
        
        return destImage;
    }
    
}</code></pre><p><p></p></div></div></div><br><div class="panel panel-default collapse-panel box-shadow-wrap-lg"><div class="panel-heading panel-collapse" data-toggle="collapse" data-target="#collapse-130260b4b13e2858fa8983f9cf81b6d068" aria-expanded="true"><div class="accordion-toggle"><span style="">OCRUtils</span>
<i class="pull-right fontello icon-fw fontello-angle-right"></i>
</div>
</div>
<div class="panel-body collapse-panel-body">
<div id="collapse-130260b4b13e2858fa8983f9cf81b6d068" class="collapse collapse-content"><p></p></p><pre><code class="lang-Java">package com.ocr.utils;

import net.sourceforge.tess4j.ITesseract;
import net.sourceforge.tess4j.Tesseract;

import java.awt.image.BufferedImage;
import java.io.File;

public class OCRUtils {
    
    public static String DEFAULT_LANG=&quot;eng&quot;;
    public static String DATA_PATH=&quot;D:/temp/test_data/&quot;;
    
    /**
     * 根据图片文件进行识别
     * 
     * @param imageFile 图片文件
     * @param lang 指定语言库
     * @return 识别文本信息
     */
    public static String doOCRFromFile(File imageFile,String lang) throws Exception {
        ITesseract instance = new Tesseract();
        instance.setDatapath(DATA_PATH); //指定语言库目录 
        instance.setTessVariable(&quot;user_defined_dpi&quot;, &quot;300&quot;);
        instance.setLanguage(lang);
        String result = instance.doOCR(imageFile);
        return result;
    }
    
    public static String doOCRFromFile(File imageFile) throws Exception {
        return doOCRFromFile(imageFile,DEFAULT_LANG);
    }
    
    /**
     * 根据图片流进行识别
     */
    public static String doOCRFromImgBuffer(BufferedImage bufferedImage,String lang) throws Exception {
        ITesseract instance = new Tesseract();
        instance.setDatapath(DATA_PATH);
        instance.setTessVariable(&quot;user_defined_dpi&quot;, &quot;300&quot;);
        instance.setLanguage(lang);
        String result = instance.doOCR(bufferedImage);
        
        return result;
    }
    
    public static String doOCRFromImgBuffer(BufferedImage bufferedImage) throws Exception {
        return doOCRFromImgBuffer(bufferedImage,DEFAULT_LANG);
    }
    
}</code></pre><p><p></p></div></div></div><br><div class="panel panel-default collapse-panel box-shadow-wrap-lg"><div class="panel-heading panel-collapse" data-toggle="collapse" data-target="#collapse-bfcbc7f7872f8b7884b0ddbc5dc18fa116" aria-expanded="true"><div class="accordion-toggle"><span style="">WindowsUtils</span>
<i class="pull-right fontello icon-fw fontello-angle-right"></i>
</div>
</div>
<div class="panel-body collapse-panel-body">
<div id="collapse-bfcbc7f7872f8b7884b0ddbc5dc18fa116" class="collapse collapse-content"><p></p></p><pre><code class="lang-Java">package com.ocr.utils;

import com.sun.jna.platform.win32.User32;
import com.sun.jna.platform.win32.WinDef.HWND;
import com.sun.jna.platform.win32.WinDef.RECT;

import java.awt.*;
import java.awt.image.BufferedImage;
import java.io.IOException;

public class WindowsUtils {
    
    /**
     * 截图：指定屏幕区域 
     * 参数为截图左上角坐标(x1,y1)+右下角坐标(x2,y2)
     */
    public static BufferedImage captureImg(int x1, int y1, int x2, int y2) throws Exception {
        Dimension screenSize = Toolkit.getDefaultToolkit().getScreenSize();
        Rectangle screenRectangle = new Rectangle(screenSize);
        Robot robot = new Robot();
        BufferedImage image = robot.createScreenCapture(screenRectangle);
        BufferedImage subimage = image.getSubimage(x1, y1, x2, y2);
        return subimage;
    }
    
    /**
     * 截图：指定窗口(使用AWT)
     */
    public static BufferedImage captureWindowAndActive(HWND hWnd) throws AWTException, IOException {
        RECT r = new RECT();
        Rectangle rect;
        User32.INSTANCE.GetWindowRect(hWnd, r);
        User32.INSTANCE.ShowWindow(hWnd, User32.INSTANCE.SW_SHOWNORMAL); //如果最小化，恢复显示
        User32.INSTANCE.SetForegroundWindow(hWnd); //激活显示
        rect = r.toRectangle();
        Robot robot = new Robot();
        BufferedImage image = robot.createScreenCapture(rect);
        return image;
    }
    
}</code></pre><p><p></p></div></div></div></p><h5>3、测试Demo</h5><p><div class="panel panel-default collapse-panel box-shadow-wrap-lg"><div class="panel-heading panel-collapse" data-toggle="collapse" data-target="#collapse-91e198aeaf85e8f2fc329f0ef658449d12" aria-expanded="true"><div class="accordion-toggle"><span style="">Demo</span>
<i class="pull-right fontello icon-fw fontello-angle-right"></i>
</div>
</div>
<div class="panel-body collapse-panel-body">
<div id="collapse-91e198aeaf85e8f2fc329f0ef658449d12" class="collapse collapse-content"><p></p></p><pre><code class="lang-Java">package com.ocr;

import com.ocr.utils.ImgFileUtils;
import com.ocr.utils.ImgUtils;
import com.ocr.utils.OCRUtils;
import com.ocr.utils.WindowsUtils;
import com.sun.jna.platform.win32.User32;
import com.sun.jna.platform.win32.WinDef;

import java.io.File;

public class DemoOCR {
    private static String WIN_TITLE=&quot;测试OCR.txt - 记事本&quot;;
    private static String PICTURE_PATH = System.getProperty(&quot;user.dir&quot;)+&quot;/picture&quot;;

/**
     * 测试OCR：指定窗口截图&amp;OCR识别
     */
    public static void testCapture() throws Exception {
        // 截图保存的路径
        File imgFile = new File(PICTURE_PATH + &quot;/capture.png&quot;);
        if (!imgFile.getParentFile().exists()) {
            imgFile.getParentFile().mkdirs();
        }

// 第一个参数是Windows窗体的窗体类，第二个参数是窗体的标题。
        WinDef.HWND hWnd = User32.INSTANCE.FindWindow(null, WIN_TITLE);
        System.out.println(&quot;找到窗体：&quot;+hWnd);

if(hWnd==null){
            System.out.println(&quot;未找到窗口&quot;);
        }else{
            // 保存截图
            ImgFileUtils.saveAsPNG(ImgUtils.clipImage(WindowsUtils.captureWindowAndActive(hWnd)), imgFile); //Active解决有些窗口截图不正常
            //String ocrRs = OCRUtils.doOCRFromFile(imgFile);
            String ocrRs = OCRUtils.doOCRFromImgBuffer(ImgUtils.clipImage(ImgUtils.grayImage(WindowsUtils.captureWindowAndActive(hWnd)))); // 灰化效果
            System.out.println(&quot;识别窗体文本信息：&quot;+ocrRs); //OCR识别，图像转文本。
        }
    }

/**
     * main method
     */
    public static void main(String[] args) {
        System.out.println(&quot;OCR文字识别已启动！&quot;);
        try {
            //设置训练库的位置
            OCRUtils.DATA_PATH=System.getProperty(&quot;user.dir&quot;)+&quot;/config&quot;;
            OCRUtils.DEFAULT_LANG=&quot;chi_sim&quot;; //eng ：英文  chi_sim ：简体中文

//测试OCR：指定窗口截图&amp;OCR识别
            WIN_TITLE=&quot;测试OCR.txt - 记事本&quot;; //用记事本打开测试文本
            testCapture();

//测试识别图片
            String ocrText = OCRUtils.doOCRFromFile(new File(PICTURE_PATH+&quot;/capture1.png&quot;)); // 灰化效果
            System.out.println(&quot;识别文本信息：&quot;+ocrText); //OCR识别，图像转文本

} catch (Exception e) {
            e.printStackTrace();
        }
    }
}</code></pre><p><p></p></div></div></div><br><div class="tip inlineBlock error">

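运行前，请在项目根目录新建两个文件夹：<br>1.<code>picture</code>：存放待识别的图片（Demo会读取其中的<code>capture1.png</code>，窗口截图也会保存为该目录下的<code>capture.png</code>）；<br>2.<code>config</code>：存放下载的语言包（例如简体中文对应<code>chi_sim.traineddata</code>）。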
</div></p>

Java Tess4J OCR文字识别实现

Tess4J简介

Demo

1、引入pom.xml配置：

2、相关Utils工具类：

3、测试Demo

2021最新官方IP地址查询接口

SpringBoot基于Hutool工具实现接口限流

宝塔面板部署ZFile网盘系统（原创改良版）

宝塔面板部署PanIndex网盘系统（原创改良版）

MyBatis-Plus代码生成器（基于3.5.1版本）

IDEA+Maven多环境配置

IDEA中打开项目所有引入的jar包不识别

e.printStackTrace();有什么危害？

去掉if...else的七种绝佳之法

JAVA快速开发微信机器人-新星框架（NewBot-Nova）

Java Tess4J OCR文字识别实现