- 实现了 ITesseractOcrService 接口中的 recognizePdfText 方法 - 添加了 PDFBox 依赖用于处理 PDF 文件 - 在 TesseractOcrServiceImpl 中实现了 PDF 文件的文字提取和清理 - 在 WmsPurchasePlanController 中添加了识别 PDF 文件文字的 API 接口
40 lines
1.4 KiB
XML
40 lines
1.4 KiB
XML
<?xml version="1.0" encoding="UTF-8"?>
<project xmlns="http://maven.apache.org/POM/4.0.0"
         xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
         xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
    <!-- Maven build descriptor for the klp-wms module. -->
    <modelVersion>4.0.0</modelVersion>

    <!-- Parent POM; this module declares no groupId or version of its own,
         so both are inherited from here. -->
    <parent>
        <groupId>com.klp</groupId>
        <artifactId>klp-oa</artifactId>
        <version>0.8.3</version>
    </parent>

    <artifactId>klp-wms</artifactId>

    <properties>
        <!-- Compile for Java 8 source and bytecode level. -->
        <maven.compiler.source>8</maven.compiler.source>
        <maven.compiler.target>8</maven.compiler.target>
        <project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
    </properties>

    <dependencies>
        <!-- Internal com.klp artifact. Its version previously repeated the parent's
             literal 0.8.3; it now follows ${project.version} (inherited from the
             parent) so the two cannot drift apart on a version bump.
             NOTE(review): assumes klp-common is versioned in lockstep with this
             module; confirm against the parent's module list. -->
        <dependency>
            <groupId>com.klp</groupId>
            <artifactId>klp-common</artifactId>
            <version>${project.version}</version>
        </dependency>

        <!-- https://mvnrepository.com/artifact/net.sourceforge.tess4j/tess4j -->
        <dependency>
            <groupId>net.sourceforge.tess4j</groupId>
            <artifactId>tess4j</artifactId>
            <version>5.11.0</version>
        </dependency>

        <!-- https://mvnrepository.com/artifact/org.apache.pdfbox/pdfbox -->
        <!-- NOTE(review): tess4j may also pull PDFBox artifacts in transitively;
             check the output of "mvn dependency:tree" for version conflicts. -->
        <dependency>
            <groupId>org.apache.pdfbox</groupId>
            <artifactId>pdfbox</artifactId>
            <version>2.0.29</version>
        </dependency>
    </dependencies>
</project>