多个word文档合并为一个文档 Java实现-CSDN博客

本文链接：https://blog.csdn.net/weixin_47509784/article/details/121272373

该代码实现了一个Java工具，用于合并Word文档：通过Apache POI库将待合并文档的正文追加到第一个文档的末尾，并把结果写回第一个文档所在的路径，无需额外新建空文档。追加的内容从新的一页开始，适合每页格式固定的文档。合并时使用Map记录图片关系ID的新旧对应关系，并在正文XML中进行替换，确保合并后图片仍然能够正确显示。

摘要生成于 C知道，由 DeepSeek-R1 满血版支持，前往体验 >

不用额外新建一个空文档，适合需要不断往一个文档中添加其他文档的情况。适合每页格式固定，添加文件新起一页的情况。可进行测试。

package could.com.hanwen.govapi.Test;

import org.apache.commons.collections.CollectionUtils;
import org.apache.poi.openxml4j.opc.OPCPackage;
import org.apache.poi.xwpf.usermodel.BreakType;
import org.apache.poi.xwpf.usermodel.Document;
import org.apache.poi.xwpf.usermodel.XWPFDocument;
import org.apache.poi.xwpf.usermodel.XWPFPictureData;
import org.apache.xmlbeans.XmlOptions;
import org.openxmlformats.schemas.wordprocessingml.x2006.main.CTBody;

import java.io.File;
import java.io.FileInputStream;
import java.io.FileOutputStream;
import java.io.IOException;
import java.io.OutputStream;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

/**
 * Appends the body of one Word (.docx) document to another using Apache POI.
 *
 * <p>The merge works on the raw body XML: the appended document's body content is
 * concatenated after the target document's body content, and picture relationship ids
 * are remapped so that embedded images still resolve in the merged file.
 *
 * <p>Usage example:
 * <pre>{@code
 * new FileCopyUtil().aqscMergeDoc("base.docx", "extra.docx"); // base.docx now ends with extra.docx
 * }</pre>
 */
public class FileCopyUtil {

    /**
     * Matches every {@code <w:sectPr>...</w:sectPr>} element. Section properties of the
     * appended document are dropped so that only the target document's page setup remains.
     */
    private static final Pattern SECT_PR = Pattern.compile(
            "<[\\s]*?w:sectPr[^>]*?>[\\s\\S]*?<[\\s]*?\\/[\\s]*?w:sectPr[\\s]*?>");

    /**
     * Appends the document at {@code mergeWord} to the document at {@code outPutPath},
     * starting the appended content on a new page, and overwrites {@code outPutPath}
     * with the merged result.
     *
     * <p>Failures are reported on standard error and not propagated, so callers never see
     * an exception from this method. The output file is only opened for writing after the
     * in-memory merge has succeeded.
     *
     * @param outPutPath path of the target .docx; it is read first and then overwritten
     * @param mergeWord  path of the .docx whose content is appended to the target
     */
    public void aqscMergeDoc(String outPutPath, String mergeWord) {
        try (XWPFDocument doc = openDocument(outPutPath);
             XWPFDocument extra = openDocument(mergeWord)) {
            // Paragraph flagged "page break before": the appended content starts on a new page.
            doc.createParagraph().setPageBreak(true);
            appendBody(doc, extra);
            // The input stream of outPutPath is already closed here, so the same path can be
            // reopened for writing; FileOutputStream truncates any existing content.
            try (OutputStream dest = new FileOutputStream(outPutPath)) {
                doc.write(dest);
            }
        } catch (Exception e) {
            // Best-effort contract kept for existing callers: report, do not rethrow.
            e.printStackTrace();
        }
    }

    /**
     * Appends the body of {@code append} to the body of {@code src}.
     *
     * <p>Every picture that is a direct relation of {@code append} is copied into
     * {@code src} with its original picture type, and references to it in the appended
     * XML are rewritten to the relationship id assigned by {@code src}.
     *
     * @param src    document that receives the content; modified in place
     * @param append document whose body content is appended
     * @throws Exception if the picture data cannot be added or the merged XML cannot be parsed
     */
    public static void appendBody(XWPFDocument src, XWPFDocument append) throws Exception {
        CTBody src1Body = src.getDocument().getBody();
        CTBody src2Body = append.getDocument().getBody();
        // Relationship id in the appended document -> relationship id in the target document.
        Map<String, String> map = new HashMap<>();
        for (XWPFPictureData picture : append.getAllPictures()) {
            String before = append.getRelationId(picture);
            if (before == null) {
                // Not related to the main document part, so the body XML has no id to remap.
                continue;
            }
            // Keep the picture's own format instead of registering everything as PNG.
            String after = src.addPictureData(picture.getData(), picture.getPictureType());
            map.put(before, after);
        }
        appendBody(src1Body, src2Body, map);
    }

    /**
     * Concatenates the XML content of {@code append} after the XML content of {@code src}
     * and stores the result back into {@code src}.
     *
     * @param src    target body; replaced with the merged body
     * @param append body whose children are appended (its section properties are dropped)
     * @param map    old-to-new relationship ids to rewrite in the appended XML; may be null or empty
     * @throws Exception if the merged XML cannot be parsed
     */
    private static void appendBody(CTBody src, CTBody append, Map<String, String> map) throws Exception {
        XmlOptions optionsOuter = new XmlOptions();
        optionsOuter.setSaveOuter();
        String appendString = SECT_PR.matcher(append.xmlText(optionsOuter)).replaceAll("");

        // Content strictly between the root start tag and the root end tag. The "+ 1" skips the
        // '>' that closes the start tag; without it a stray '>' leaks into the merged body.
        int appendStart = appendString.indexOf('>') + 1;
        int appendEnd = appendString.lastIndexOf('<');
        if (appendEnd < appendStart) {
            // Self-closing root element: the appended body is empty, nothing to merge.
            return;
        }
        String addPart = remapRelationIds(appendString.substring(appendStart, appendEnd), map);

        String srcString = src.xmlText();
        int srcStart = srcString.indexOf('>') + 1;
        int srcEnd = srcString.lastIndexOf('<');
        String prefix = srcString.substring(0, srcStart);
        String mainPart = srcString.substring(srcStart, srcEnd);
        String sufix = srcString.substring(srcEnd);

        // Re-parse the concatenated XML and swap it in as the target body.
        // NOTE(review): namespace prefixes used by the appended XML are resolved against the
        // declarations in the target's root tag — assumes both documents declare the same prefixes.
        CTBody makeBody = CTBody.Factory.parse(prefix + mainPart + addPart + sufix);
        src.set(makeBody);
    }

    /**
     * Rewrites relationship ids in {@code xml} according to {@code idMap} in a single pass.
     *
     * <p>Only complete quoted attribute values are replaced. This prevents {@code rId1} from
     * matching inside {@code rId10}, and prevents an id produced by one replacement from being
     * rewritten again by another mapping.
     */
    private static String remapRelationIds(String xml, Map<String, String> idMap) {
        if (idMap == null || idMap.isEmpty()) {
            return xml;
        }
        StringBuilder alternatives = new StringBuilder();
        for (String oldId : idMap.keySet()) {
            if (alternatives.length() > 0) {
                alternatives.append('|');
            }
            alternatives.append(Pattern.quote(oldId));
        }
        // group(1) = quote character, group(2) = old relationship id, \1 = matching closing quote.
        Matcher refs = Pattern.compile("([\"'])(" + alternatives + ")\\1").matcher(xml);
        StringBuffer out = new StringBuffer(xml.length());
        while (refs.find()) {
            String quote = refs.group(1);
            String newId = idMap.get(refs.group(2));
            refs.appendReplacement(out, Matcher.quoteReplacement(quote + newId + quote));
        }
        refs.appendTail(out);
        return out.toString();
    }

    /** Loads a .docx file into memory and closes the file stream before returning. */
    private static XWPFDocument openDocument(String path) throws IOException {
        try (FileInputStream in = new FileInputStream(path)) {
            return new XWPFDocument(in);
        }
    }
}

如果希望追加的文档直接接在上一文档的末尾（不另起一页），可以将 appendBody 方法中 srcString 的赋值语句替换为：

		// Strip explicit page breaks from the source body XML before concatenation: first whole
		// paragraphs that contain nothing but a page-break run, then any remaining page-break runs.
		String srcString = src.xmlText().replaceAll( "<w:p><w:r><w:br w:type=\"page\"/></w:r></w:p>", "" ).replaceAll( "<w:r><w:br w:type=\"page\"/></w:r>", "" );