// Copy this code and add pdfbox-1.8.16.jar to the classpath to use it. The jar can be downloaded from:
// https://www.apache.org/dyn/closer.lua/pdfbox/1.8.16/pdfbox-1.8.16.jar
package PdfAndWord;
import org.apache.pdfbox.pdmodel.PDDocument;
import org.apache.pdfbox.util.PDFTextStripper;
import java.io.*;
/**
 * Extracts the text of a PDF file and writes it next to the source file with a
 * {@code .doc} extension.
 * <p>
 * The output is whatever {@link PDFTextStripper} emits, written through a plain
 * UTF-8 {@link Writer}; it is a text file named {@code .doc}, not a binary Word document.
 *
 * @author jianpipi
 * @version V1.0.0
 * @create 2021/6/23
 */
public class PdfChangeWord
{
    /** PDF that is converted when no path is passed on the command line. */
    private static final String DEFAULT_PDF_PATH = "D:/xxxxx.pdf";

    /**
     * Converts one PDF file to a {@code .doc} text file.
     * <p>
     * Any {@link IOException} raised while reading the PDF or writing the output is
     * reported on the console and not rethrown.
     *
     * @param args optional; {@code args[0]} is the path of the PDF to convert.
     *             When absent, {@link #DEFAULT_PDF_PATH} is used.
     */
    public static void main(String[] args){
        String pdfFilePath = (args != null && args.length > 0) ? args[0] : DEFAULT_PDF_PATH;
        String newWordFileName = toWordFileName(pdfFilePath);

        // The PDF is opened first so that a missing or unreadable input does not
        // leave an empty output file behind. try-with-resources closes everything
        // (in reverse order) even when the extraction fails part-way.
        try (PDDocument pdfDoc = PDDocument.load(new File(pdfFilePath));
             FileOutputStream fos = new FileOutputStream(newWordFileName);
             Writer writer = new OutputStreamWriter(fos, "UTF-8")) {
            int pageNumber = pdfDoc.getNumberOfPages();

            PDFTextStripper stripper = new PDFTextStripper();
            // Order the extracted text by its position on the page.
            stripper.setSortByPosition(true);
            // First page to convert (1-based).
            stripper.setStartPage(1);
            // Last page to convert.
            stripper.setEndPage(pageNumber);
            stripper.writeText(pdfDoc, writer);
        }
        catch (IOException e){
            System.out.println("啊哦出异常了!");
            e.printStackTrace();
            return;
        }

        // Reported only after the writer has been flushed and closed without error.
        System.out.println("pdf转换word转换完成!");
    }

    /**
     * Derives the output file name by replacing the extension of the given path with {@code .doc}.
     * <p>
     * Only a dot inside the file name itself counts as the start of an extension, so a
     * dot in a directory name is left alone; a path without an extension simply gets
     * {@code .doc} appended.
     *
     * @param pdfFilePath path of the source PDF
     * @return the path of the file to write
     */
    private static String toWordFileName(String pdfFilePath) {
        int lastSeparator = Math.max(pdfFilePath.lastIndexOf('/'), pdfFilePath.lastIndexOf('\\'));
        int lastDot = pdfFilePath.lastIndexOf('.');
        String basePath = lastDot > lastSeparator ? pdfFilePath.substring(0, lastDot) : pdfFilePath;
        return basePath + ".doc";
    }
}