doc转html - 易不易

link管理

链接快照平台

输入网页链接，自动生成快照
标签化管理网页链接

相关文章推荐

爱热闹的葫芦 · Column.IsIdentity ...· 2 周前 ·

兴奋的玉米 · Mapping Attributes✨ | ...· 2 周前 ·

文武双全的小笼包 · 《lua 程序设计》读书笔记（2）：数值 ...· 2 周前 ·

刀枪不入的马铃薯 · ASP.NET Core 中的配置 | ...· 2 周前 ·

呐喊的书签 · java循环出现异常，不终止程序，继续执行 ...· 4 天前 ·

彷徨的骆驼 · 以病人为中心以问题为导向 ...· 2 月前 ·

性感的凉面 · MySQL实战：轻松计算基于出生日期的年龄· 3 月前 ·

宽容的毛衣 · 聚焦2024汉诺威商用车展，未势能源携高效氢 ...· 3 月前 ·

有胆有识的槟榔 · 特征工程在营销组合建模中的应用：基于因果推断 ...· 3 月前 ·

冷冷的移动电源 · “柏林爱乐在上海”奏响首场音乐会 ...· 4 月前 ·

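<dependency>
    <groupId>fr.opensagres.xdocreport</groupId>
    <artifactId>fr.opensagres.xdocreport.document</artifactId>
    <version>1.0.5</version>
</dependency>
<dependency>
    <groupId>fr.opensagres.xdocreport</groupId>
    <artifactId>org.apache.poi.xwpf.converter.xhtml</artifactId>
    <version>1.0.5</version>
</dependency>
<dependency>
    <groupId>org.apache.poi</groupId>
    <artifactId>poi-scratchpad</artifactId>
    <version>3.12</version>
</dependency>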

Java 代码

package com.zh.html2pdf.test;
import org.apache.poi.hwpf.HWPFDocument;
import org.apache.poi.hwpf.converter.WordToHtmlConverter;
import org.apache.poi.xwpf.converter.core.FileImageExtractor;
import org.apache.poi.xwpf.converter.core.FileURIResolver;
import org.apache.poi.xwpf.converter.xhtml.XHTMLConverter;
import org.apache.poi.xwpf.converter.xhtml.XHTMLOptions;
import org.apache.poi.xwpf.usermodel.XWPFDocument;
import org.w3c.dom.Document;
import javax.xml.parsers.DocumentBuilderFactory;
import javax.xml.transform.OutputKeys;
import javax.xml.transform.Transformer;
import javax.xml.transform.TransformerFactory;
import javax.xml.transform.dom.DOMSource;
import javax.xml.transform.stream.StreamResult;
import java.io.*;
public class CaseHtmTest {
    public static void main(String[] args) throws Exception {
        String filePath = "C:/Users/v/Desktop/doc/测试.docx";
        File file = new File(filePath);
        filePath=filePath.substring(0, filePath.lastIndexOf("/")+1);
        String name = file.getName().substring(0, file.getName().lastIndexOf("."));
        System.out.println(file.getName());
        if (file.getName().endsWith(".docx") || file.getName().endsWith(".DOCX")) {
                CaseHtmTest.docx(filePath ,file.getName(),name +".html");
        }else{
                CaseHtmTest.dox(filePath ,file.getName(),name +".html");
     * 转换docx
     * @param filePath
     * @param fileName
     * @param htmlName
     * @throws Exception
    public static void docx(String filePath ,String fileName,String htmlName) throws Exception{
        final String file = filePath + fileName;
        File f = new File(file);
// ) 加载word文档生成 XWPFDocument对象
        InputStream in = new FileInputStream(f);
        XWPFDocument document = new XWPFDocument(in);
// ) 解析 XHTML配置 (这里设置IURIResolver来设置图片存放的目录)
        File imageFolderFile = new File(filePath);
        XHTMLOptions options = XHTMLOptions.create().URIResolver(new FileURIResolver(imageFolderFile));
        options.setExtractor(new FileImageExtractor(imageFolderFile));
        options.setIgnoreStylesIfUnused(false);
        options.setFragment(true);
// ) 将 XWPFDocument转换成XHTML
        OutputStream out = new FileOutputStream(new File(filePath + htmlName));
        XHTMLConverter.getInstance().convert(document, out, options);
     * 转换doc
     * @param filePath
     * @param fileName
     * @param htmlName
     * @throws Exception
    public static void dox(String filePath ,String fileName,String htmlName) throws Exception{
        final String file = filePath + fileName;
        InputStream input = new FileInputStream(new File(file));
        HWPFDocument wordDocument = new HWPFDocument(input);
        WordToHtmlConverter wordToHtmlConverter = new WordToHtmlConverter(DocumentBuilderFactory.newInstance().newDocumentBuilder().newDocument());
        //解析word文档
        wordToHtmlConverter.processDocument(wordDocument);
        Document htmlDocument = wordToHtmlConverter.getDocument();
        File htmlFile = new File(filePath + htmlName);
        OutputStream outStream = new FileOutputStream(htmlFile);
        DOMSource domSource = new DOMSource(htmlDocument);
        StreamResult streamResult = new StreamResult(outStream);
        TransformerFactory factory = TransformerFactory.newInstance();
        Transformer serializer = factory.newTransformer();
        serializer.setOutputProperty(OutputKeys.ENCODING, "utf-8");
        serializer.setOutputProperty(OutputKeys.INDENT, "yes");
        serializer.setOutputProperty(OutputKeys.METHOD, "html");
        serializer.transform(domSource, streamResult);
        outStream.close();