依赖
<!-- pdf表格解析依赖包 -->
<dependency>
<groupId>org.apache.pdfbox</groupId>
<artifactId>pdfbox</artifactId>
<version>2.0.24</version>
</dependency>
<dependency>
<groupId>technology.tabula</groupId>
<artifactId>tabula</artifactId>
<version>1.0.3</version>
</dependency>
<!-- json字符串反序列化依赖包 -->
<dependency>
<groupId>com.fasterxml.jackson.core</groupId>
<artifactId>jackson-databind</artifactId>
<version>2.9.5</version>
</dependency>
代码
//-f导出格式,默认CSV (一定要大写)
//-p 指定导出哪些页,all 表示所有页
//path D:\\1xx.pdf
//-l 强制使用 lattice(格线)模式提取PDF (关键在于这儿)
private static void parse() throws ParseException, IOException {
long start = System.currentTimeMillis();
St