Procházet zdrojové kódy

file-service 添加 tess4j 依赖实现 ocr 功能

reghao před 2 měsíci
rodič
revize
409abc0289

+ 6 - 0
file/file-service/pom.xml

@@ -140,6 +140,12 @@
             <version>2.1.1</version>
         </dependency>
 
+        <dependency>
+            <groupId>net.sourceforge.tess4j</groupId>
+            <artifactId>tess4j</artifactId>
+            <version>5.3.0</version>
+        </dependency>
+
         <dependency>
             <groupId>org.springdoc</groupId>
             <artifactId>springdoc-openapi-ui</artifactId>

+ 17 - 0
file/file-service/src/test/java/DiskUnitTest.java

@@ -1,5 +1,7 @@
 import cn.reghao.tnb.file.app.zdisk.model.vo.FileTree;
 import cn.reghao.tnb.oss.api.constant.ObjectType;
+import net.sourceforge.tess4j.Tesseract;
+import org.junit.jupiter.api.Test;
 import org.mockito.junit.MockitoJUnitRunner;
 
 import java.io.File;
@@ -86,4 +88,19 @@ public class DiskUnitTest {
         });
         System.out.println("main-thread goto sleep...");*/
     }
+
+    /**
+     * Manual OCR check: runs tess4j's {@code Tesseract} on a local image file and
+     * prints the string returned by {@code doOCR} to standard output.
+     *
+     * No assertions are made. Both the data path and the image path are absolute
+     * paths under /home/reghao/Downloads, so this only runs on a machine that has
+     * those files in place.
+     *
+     * @throws Exception propagated from the OCR call
+     */
+    @Test
+    public void ocrTest() throws Exception {
+        Tesseract tess = new Tesseract();
+        // Location of the language data files
+        tess.setDatapath("/home/reghao/Downloads/tess");
+        // Mixed English and Simplified Chinese
+        tess.setLanguage("eng+chi_sim");
+        //tess.setLanguage("chi_sim");
+//        tess.setLanguage("eng");
+
+        String imagePath = "/home/reghao/Downloads/1620438.png";
+        String result = tess.doOCR(new File(imagePath));
+        System.out.println(result);
+    }
 }