Java实现将word转换为html的方法示例【doc与docx格式】

本文实例讲述了Java实现将word转换为html的方法。分享给大家供大家参考,具体如下:

public static void main(String[] args) throws Exception {

String filePath = "C:/Users/Administrator/Desktop/92个诊疗方案及临床路径/";

File file = new File(filePath);

File[] files = file.listFiles();

String name = null;

for (File file2 : files) {

Thread.sleep(500);

name = file2.getName().substring(0, file2.getName().lastIndexOf("."));

System.out.println(file2.getName());

if (file2.getName().endsWith(".docx") || file2.getName().endsWith(".DOCX")) {

CaseHtm.docx(filePath ,file2.getName(),name +".htm");

}else{

CaseHtm.dox(filePath ,file2.getName(),name +".htm");

}

}

}

/**

* 转换docx

* @param filePath

* @param fileName

* @param htmlName

* @throws Exception

*/

public static void docx(String filePath ,String fileName,String htmlName) throws Exception{

final String file = filePath + fileName;

File f = new File(file);

// ) 加载word文档生成 XWPFDocument对象

InputStream in = new FileInputStream(f);

XWPFDocument document = new XWPFDocument(in);

// ) 解析 XHTML配置 (这里设置IURIResolver来设置图片存放的目录)

File imageFolderFile = new File(filePath);

XHTMLOptions options = XHTMLOptions.create().URIResolver(new FileURIResolver(imageFolderFile));

options.setExtractor(new FileImageExtractor(imageFolderFile));

options.setIgnoreStylesIfUnused(false);

options.setFragment(true);

// ) 将 XWPFDocument转换成XHTML

OutputStream out = new FileOutputStream(new File(filePath + htmlName));

XHTMLConverter.getInstance().convert(document, out, options);

}

/**

* 转换doc

* @param filePath

* @param fileName

* @param htmlName

* @throws Exception

*/

public static void dox(String filePath ,String fileName,String htmlName) throws Exception{

final String file = filePath + fileName;

InputStream input = new FileInputStream(new File(file));

HWPFDocument wordDocument = new HWPFDocument(input);

WordToHtmlConverter wordToHtmlConverter = new WordToHtmlConverter(DocumentBuilderFactory.newInstance().newDocumentBuilder().newDocument());

//解析word文档

wordToHtmlConverter.processDocument(wordDocument);

Document htmlDocument = wordToHtmlConverter.getDocument();

File htmlFile = new File(filePath + htmlName);

OutputStream outStream = new FileOutputStream(htmlFile);

DOMSource domSource = new DOMSource(htmlDocument);

StreamResult streamResult = new StreamResult(outStream);

TransformerFactory factory = TransformerFactory.newInstance();

Transformer serializer = factory.newTransformer();

serializer.setOutputProperty(OutputKeys.ENCODING, "utf-8");

serializer.setOutputProperty(OutputKeys.INDENT, "yes");

serializer.setOutputProperty(OutputKeys.METHOD, "html");

serializer.transform(domSource, streamResult);

outStream.close();

}

<dependency>

<groupId>fr.opensagres.xdocreport</groupId>

<artifactId>fr.opensagres.xdocreport.document</artifactId>

<version>1.0.5</version>

</dependency>

<dependency>

<groupId>fr.opensagres.xdocreport</groupId>

<artifactId>org.apache.poi.xwpf.converter.xhtml</artifactId>

<version>1.0.5</version>

</dependency>

<dependency>

<groupId>org.apache.poi</groupId>

<artifactId>poi</artifactId>

<version>3.12</version>

</dependency>

<dependency>

<groupId>org.apache.poi</groupId>

<artifactId>poi-scratchpad</artifactId>

<version>3.12</version>

</dependency>

更多关于java算法相关内容感兴趣的读者可查看本站专题:《Java文件与目录操作技巧汇总》、《Java数据结构与算法教程》、《Java操作DOM节点技巧总结》和《Java缓存操作技巧汇总》

希望本文所述对大家java程序设计有所帮助。

以上是 Java实现将word转换为html的方法示例【doc与docx格式】 的全部内容, 来源链接: utcz.com/z/336415.html

回到顶部