java文档合并,在合并doc格式时报错Package should contain a content type part [M1.13]代码如下,如何解决?

java文档合并,在合并doc格式时报错Package should contain a content type part [M1.13]
代码如下(怀疑是只支持docx格式的文档,请问如何更改)


package com.common.utils;


import org.apache.poi.openxml4j.opc.OPCPackage;
import org.apache.poi.openxml4j.util.ZipSecureFile;
import org.apache.poi.xwpf.usermodel.Document;
import org.apache.poi.xwpf.usermodel.XWPFDocument;
import org.apache.poi.xwpf.usermodel.XWPFPictureData;
import org.apache.xmlbeans.XmlOptions;
import org.openxmlformats.schemas.wordprocessingml.x2006.main.CTBody;

import java.io.File;
import java.io.FileInputStream;
import java.io.FileOutputStream;
import java.io.OutputStream;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
import java.util.Map;

/**
 * @Author mischen
 * @Description 文件合并 只支持.docx
 * @Date 2022/11/21 16:30
 * @Version 1.0
 */
public class DocxMerge {
    public static void main(String[] args) {
        File file1 = new File("F:\\test1\\3.docx");
        List<File> targetFile1 = new ArrayList<>();
        targetFile1.add(new File("F:\\test1\\a.docx"));
        targetFile1.add(new File("F:\\test1\\01-系统架构设计师教程(第4版)_划了重点.docx"));

        appendDocx(file1, targetFile1);
        System.out.println("合并成功!!!");
    }

    /**
     * 把多个docx文件合并成一个
     *
     * @param outfile    输出文件
     * @param targetFile 目标文件
     */
    public static void appendDocx(File outfile, List<File> targetFile) {
        try {

            OutputStream dest = new FileOutputStream(outfile);
            ArrayList<XWPFDocument> documentList = new ArrayList<>();
            XWPFDocument doc = null;
            for (int i = 0; i < targetFile.size(); i++) {
                ZipSecureFile.setMinInflateRatio(-1.0d);
                FileInputStream in = new FileInputStream(targetFile.get(i).getPath());
                OPCPackage open = OPCPackage.open(in);
                XWPFDocument document = new XWPFDocument(open);
                documentList.add(document);
            }
            for (int i = 0; i < documentList.size(); i++) {
                doc = documentList.get(0);
                if (i != 0) {
                    //解决word合并完后,所有表格都紧紧挨在一起,没有分页。加上了分页符可解决
                    documentList.get(i).createParagraph().setPageBreak(true);
                    appendBody(doc, documentList.get(i));
                }
            }

            doc.write(dest);
        } catch (Exception e) {
            e.printStackTrace();
        }
    }

    public static void appendBody(XWPFDocument src, XWPFDocument append) throws Exception {
        CTBody src1Body = src.getDocument().getBody();
        CTBody src2Body = append.getDocument().getBody();

        List<XWPFPictureData> allPictures = append.getAllPictures();
        // 记录图片合并前及合并后的ID
        Map<String, String> map = new HashMap<>();
        for (XWPFPictureData picture : allPictures) {
            String before = append.getRelationId(picture);
            //将原文档中的图片加入到目标文档中
            String after = src.addPictureData(picture.getData(), Document.PICTURE_TYPE_PNG);
            map.put(before, after);
        }
        //这个代码主要解决合并word报错,解析抛出压缩炸弹
        ZipSecureFile.setMinInflateRatio(-1.0d);
        appendBody(src1Body, src2Body, map);

    }

    private static void appendBody(CTBody src, CTBody append, Map<String, String> map) throws Exception {
        XmlOptions optionsOuter = new XmlOptions();
        optionsOuter.setSaveOuter();
        String appendString = append.xmlText(optionsOuter);

        String srcString = src.xmlText();
        String prefix = srcString.substring(0, srcString.indexOf(">") + 1);
        String mainPart = srcString.substring(srcString.indexOf(">") + 1, srcString.lastIndexOf("<"));
        String sufix = srcString.substring(srcString.lastIndexOf("<"));
        String addPart = appendString.substring(appendString.indexOf(">") + 1, appendString.lastIndexOf("<"));
        //下面这部分可以去掉,我加上的原因是合并的时候,有时候出现打不开的情况,对照document.xml将某些标签去掉就可以正常打开了
        addPart = addPart.replaceAll("w14:paraId=\"[A-Za-z0-9]{1,10}\"", "");
        addPart = addPart.replaceAll("w14:textId=\"[A-Za-z0-9]{1,10}\"", "");
        addPart = addPart.replaceAll("w:rsidP=\"[A-Za-z0-9]{1,10}\"", "");
        addPart = addPart.replaceAll("w:rsidRPr=\"[A-Za-z0-9]{1,10}\"", "");
        addPart = addPart.replace("<w:headerReference r:id=\"rId8\" w:type=\"default\"/>","");
        addPart = addPart.replace("<w:footerReference r:id=\"rId9\" w:type=\"default\"/>","");
        addPart = addPart.replace("xsi:nil=\"true\"","");

        if (map != null && !map.isEmpty()) {
            //对xml字符串中图片ID进行替换
            for (Map.Entry<String, String> set : map.entrySet()) {
                addPart = addPart.replace(set.getKey(), set.getValue());
            }
        }
        //将两个文档的xml内容进行拼接
        CTBody makeBody = CTBody.Factory.parse(prefix + mainPart + addPart + sufix);

        src.set(makeBody);
    }
}



我写个demo

import java.io.File;
import java.io.FileInputStream;
import java.io.FileOutputStream;
import java.io.IOException;
import java.io.InputStream;
import java.io.OutputStream;
import java.util.ArrayList;
import java.util.List;

import org.apache.poi.hwpf.HWPFDocument;
import org.apache.poi.hwpf.usermodel.Range;
import org.apache.poi.openxml4j.exceptions.InvalidFormatException;
import org.apache.poi.openxml4j.opc.OPCPackage;
import org.apache.poi.xwpf.usermodel.XWPFDocument;

/**
 * @author icepippip
 * @Description 文件合并 支持.doc和.docx
 * @date 2023/5/29 20:18
 * @Version 1.0
 */
public class DocMerge {
    
    public static void main(String[] args) throws IOException, InvalidFormatException {
        File file1 = new File("F:\\test1\\3.docx");
        List<File> targetFile1 = new ArrayList<>();
        targetFile1.add(new File("F:\\test1\\a.docx"));
        targetFile1.add(new File("F:\\test1\\01-系统架构设计师教程(第4版)_划了重点.doc"));
 
        File outfile = new File("F:\\test1\\merged.docx");
        mergeDocs(outfile, targetFile1);
        System.out.println("合并成功!");
    }
    
    /**
     * 合并多个doc和docx文件
     *
     * @param outfile 目标文件
     * @param files   源文件列表
     * @throws IOException
     * @throws InvalidFormatException
     */
    public static void mergeDocs(File outfile, List<File> files) throws IOException, InvalidFormatException {
        OutputStream out = new FileOutputStream(outfile);
        List<InputStream> streams = new ArrayList<>();
        
        try {
            for (File file : files) {
                String fileName = file.getName();
                InputStream in = new FileInputStream(file);
                if (fileName.endsWith(".doc")) {
                    HWPFDocument doc = new HWPFDocument(in);
                    Range range = doc.getRange();
                    appendRange(out, range);
                    doc.close();
                } else if (fileName.endsWith(".docx")) {
                    OPCPackage pkg = OPCPackage.open(in);
                    XWPFDocument doc = new XWPFDocument(pkg);
                    appendDocument(out, doc);
                    doc.close();
                }
                in.close();
            }
        } finally {
            for (InputStream stream : streams) {
                stream.close();
            }
            out.close();
        }
    }
    
    /**
     * 将一个HWPFDocument的Range追加到输出流中
     *
     * @param out   输出流
     * @param range 范围
     * @throws IOException
     */
    public static void appendRange(OutputStream out, Range range) throws IOException {
        out.write(range.serialize());
    }
    
    /**
     * 将一个XWPFDocument追加到输出流中
     *
     * @param out 输出流
     * @param doc 文档
     * @throws IOException
     */
    public static void appendDocument(OutputStream out, XWPFDocument doc) throws IOException {
        doc.write(out);
    }
}

pom 依赖如下

<dependency>
    <groupId>org.apache.poi</groupId>
    <artifactId>poi</artifactId>
    <version>4.1.2</version>
</dependency>
<dependency>
    <groupId>org.apache.poi</groupId>
    <artifactId>poi-ooxml</artifactId>
    <version>4.1.2</version>
</dependency>
<dependency>
    <groupId>org.apache.poi</groupId>
    <artifactId>poi-ooxml-schemas</artifactId>
    <version>4.1.2</version>
</dependency>
<dependency>
    <groupId>org.apache.poi</groupId>
    <artifactId>poi-scratchpad</artifactId>
    <version>4.1.2</version>
</dependency>