From c545063654fda09763ef9199ad4a8ce42efc0b12 Mon Sep 17 00:00:00 2001 From: zjh <1084500556@qq.com> Date: 星期三, 10 一月 2024 17:53:51 +0800 Subject: [PATCH] zjh 2024/01/10--1 --- ltkj-admin/src/test/java/ImageTextExtractor.java | 23 ++++++++++++++++------- 1 files changed, 16 insertions(+), 7 deletions(-) diff --git a/ltkj-admin/src/test/java/ImageTextExtractor.java b/ltkj-admin/src/test/java/ImageTextExtractor.java index 23c0b25..c02f45a 100644 --- a/ltkj-admin/src/test/java/ImageTextExtractor.java +++ b/ltkj-admin/src/test/java/ImageTextExtractor.java @@ -1,16 +1,24 @@ +import net.sourceforge.tess4j.ITesseract; import net.sourceforge.tess4j.Tesseract; import net.sourceforge.tess4j.TesseractException; +import javax.imageio.ImageIO; +import java.awt.image.BufferedImage; import java.io.File; +import java.io.IOException; public class ImageTextExtractor { - public static String extractTextFromImage(String imagePath) { + public static String extractTextFromImage(String imagePath) throws IOException { File imageFile = new File(imagePath); - Tesseract tesseract = new Tesseract(); + ITesseract instance = new Tesseract(); // JNA Interface Mapping try { - tesseract.setLanguage("eng"); - String result = tesseract.doOCR(imageFile); + instance.setDatapath("D:\\develop\\OCR\\tessdata"); // set tessdata path + instance.setLanguage("chi_sim"); // set recognition language +// instance.setLanguage("eng"); // set recognition language + instance.setTessVariable("user_defined_dpi","300"); + BufferedImage image = ImageIO.read(imageFile); + String result = instance.doOCR(image); return result; } catch (TesseractException e) { e.printStackTrace(); @@ -18,9 +26,10 @@ } } - public static void main(String[] args) { - String imagePath = "C:\\Users\\w\\Pictures\\Saved Pictures\\涓崕浜烘皯鍏卞拰鍥戒竾宀�.jpg"; + public static void main(String[] args) throws IOException { + String imagePath = "C:\\Users\\w\\Pictures\\Saved Pictures\\333.png"; String extractedText = extractTextFromImage(imagePath); System.out.println(extractedText); } -} \ No newline at end of file +} + -- Gitblit v1.8.0