From e953fa49251f0baff0bc4b9adda91d6c1692646f Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?=E8=91=A3=E5=93=B2=E5=A5=87?= <13840175730@139.com>
Date: Wed, 24 Apr 2024 10:31:31 +0800
Subject: [PATCH] =?UTF-8?q?1.PDF=E8=AF=BB=E5=8F=96demo?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
Reviewer notes (ignored by git am, not part of the commit message):
* Test.main now loads a fixed PDF with PDFBox, extracts its text with
  PDFTextStripper, prints it and writes it to a .txt file.
* The PDDocument is closed via try-with-resources so it is released even
  when text extraction throws.
* The output file is encoded explicitly as UTF-8 instead of the platform
  default charset.
* NOTE(review): this patch was reconstructed from a copy whose line breaks
  and indentation had been lost. The positions of blank context lines and
  the 4-space indentation are assumptions; confirm against base blob
  ca960aa before applying. The post-image blob id on the "index" line is
  carried over from the original patch and does not describe this
  revised content.

 src/main/java/com/dsic/gj_erp/Test.java | 36 +++++++++++++++++++++++++++++++++---
 1 file changed, 33 insertions(+), 3 deletions(-)

diff --git a/src/main/java/com/dsic/gj_erp/Test.java b/src/main/java/com/dsic/gj_erp/Test.java
index ca960aa..99cadc4 100644
--- a/src/main/java/com/dsic/gj_erp/Test.java
+++ b/src/main/java/com/dsic/gj_erp/Test.java
@@ -1,7 +1,14 @@
 package com.dsic.gj_erp;
 
+import org.apache.pdfbox.pdmodel.PDDocument;
+import org.apache.pdfbox.text.PDFTextStripper;
 import org.springframework.boot.SpringApplication;
 
+import java.io.File;
+import java.io.IOException;
+import java.nio.charset.StandardCharsets;
+import java.nio.file.Files;
+import java.nio.file.Paths;
 import java.time.LocalDate;
 import java.time.Period;
 import java.util.List;
@@ -9,10 +16,33 @@ import java.util.regex.Matcher;
 import java.util.regex.Pattern;
 
 public class Test {
-    public static void main(String[] args) {
-        String aaa="gagagag";
+    /**
+     * Demo entry point: extracts the text of a fixed PDF file with PDFBox, prints it to the
+     * console and writes it to a text file.
+     *
+     * @param args command-line arguments; not used
+     * @throws IOException if the PDF cannot be loaded or the text file cannot be written
+     */
+    public static void main(String[] args) throws IOException {
+        //String aaa="gagagag";
         //System.out.println(aaa.split("@")[0]);
-        System.out.println("aaa = " + String.format("%03d",1));
+        //System.out.println("aaa = " + String.format("%03d",1));
+
+        String pdfFilePath = "E:/B046HC103HN第046批量数控套料图2023-05-11.pdf"; // Path of the PDF file to read
+        String text;
+        // try-with-resources closes the document even if text extraction throws
+        try (PDDocument document = PDDocument.load(new File(pdfFilePath))) {
+            PDFTextStripper stripper = new PDFTextStripper();
+            text = stripper.getText(document);
+        }
+
+        // Print the extracted text to the console
+        System.out.println(text);
+
+        // Optionally, also write the text to a file
+        String outputPath = "E:/B046HC103HN第046批量数控套料图2023-05-11.txt"; // Path of the output text file
+        // Encode explicitly as UTF-8 so the output does not depend on the platform default charset
+        Files.write(Paths.get(outputPath), text.getBytes(StandardCharsets.UTF_8));
     }
 
 }