pdf 转html java_Java实现Word/Pdf/TXT转html

1 packagecom.svse.controller;2

3 importjavax.xml.parsers.DocumentBuilderFactory;4 importjavax.xml.parsers.ParserConfigurationException;5 importjavax.xml.transform.OutputKeys;6 importjavax.xml.transform.Transformer;7 importjavax.xml.transform.TransformerException;8 importjavax.xml.transform.TransformerFactory;9 importjavax.xml.transform.dom.DOMSource;10 importjavax.xml.transform.stream.StreamResult;11

12 importorg.apache.poi.hwpf.HWPFDocument;13 importorg.apache.poi.hwpf.converter.PicturesManager;14 importorg.apache.poi.hwpf.converter.WordToHtmlConverter;15 importorg.apache.poi.hwpf.usermodel.PictureType;16 importorg.apache.poi.xwpf.converter.core.BasicURIResolver;17 importorg.apache.poi.xwpf.converter.core.FileImageExtractor;18 importorg.apache.poi.xwpf.converter.core.FileURIResolver;19 importorg.apache.poi.xwpf.converter.core.IURIResolver;20 importorg.apache.poi.xwpf.converter.core.IXWPFConverter;21 importorg.apache.poi.xwpf.converter.xhtml.XHTMLConverter;22 importorg.apache.poi.xwpf.converter.xhtml.XHTMLOptions;23 importorg.apache.poi.xwpf.usermodel.XWPFDocument;24 /**

25 * word 转换成html26 */

27 public classTestWordToHtml {28

29 public static final String STORAGEPATH="C://works//files//";30 public static final String IP="192.168.30.222";31 public static

  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
以下是Java实现Word/Pdf/TXTHTML的示例代码,您可以根据需要进行修改以实现转换WordPdf: ```java import java.io.*; import org.apache.poi.hwpf.HWPFDocument; import org.apache.poi.hwpf.converter.WordToHtmlConverter; import org.apache.poi.hwpf.usermodel.Range; import org.apache.poi.xwpf.converter.core.BasicURIResolver; import org.apache.poi.xwpf.converter.core.FileImageExtractor; import org.apache.poi.xwpf.converter.core.IURIResolver; import org.apache.poi.xwpf.converter.core.XWPFConverterException; import org.apache.poi.xwpf.converter.html.*; import org.apache.poi.xwpf.usermodel.XWPFDocument; public class ConvertToHtml { public static void main(String[] args) throws Exception { String inputFile = "input.docx"; String outputFile = "output.html"; convertToHtml(inputFile, outputFile); } public static void convertToHtml(String inputFile, String outputFile) throws Exception { if (inputFile.endsWith(".docx")) { convertDocxToHtml(inputFile, outputFile); } else if (inputFile.endsWith(".doc")) { convertDocToHtml(inputFile, outputFile); } else if (inputFile.endsWith(".txt")) { convertTxtToHtml(inputFile, outputFile); } else { throw new IllegalArgumentException("Unsupported file type: " + inputFile); } } private static void convertDocxToHtml(String inputFile, String outputFile) throws IOException, XWPFConverterException { try (InputStream in = new FileInputStream(inputFile); OutputStream out = new FileOutputStream(outputFile)) { XWPFDocument document = new XWPFDocument(in); IURIResolver resolver = new BasicURIResolver("."); FileImageExtractor extractor = new FileImageExtractor(new File(".")); XHTMLConverter.getInstance().convert(document, out, resolver, extractor); } } private static void convertDocToHtml(String inputFile, String outputFile) throws IOException { try (InputStream in = new FileInputStream(inputFile); HWPFDocument document = new HWPFDocument(in); OutputStream out = new FileOutputStream(outputFile)) { WordToHtmlConverter converter = new WordToHtmlConverter(DocumentBuilderFactory.newInstance().newDocumentBuilder().newDocument()); converter.processDocument(document); Range range = document.getRange(); out.write(converter.getDocument().getBytes()); } catch (ParserConfigurationException e) { throw new IOException(e); } } private static void convertTxtToHtml(String inputFile, String outputFile) throws IOException { try (BufferedReader in = new BufferedReader(new FileReader(inputFile)); PrintWriter out = new PrintWriter(new FileWriter(outputFile))) { out.println("<html>"); out.println("<body>"); String line; while ((line = in.readLine()) != null) { out.println(line); out.println("<br>"); } out.println("</body>"); out.println("</html>"); } } } ``` 您可以使用此代码将WordPdfTxt文件转换HTML,然后使用其他工具将HTML转换PdfWord。例如,您可以使用iText库将HTML转换Pdf,或使用Apache POI将HTML转换Word

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值