java将word转换为html(代码)

互联网 19-8-14
public static void main(String[] args) throws Exception {     String filePath = "C:/Users/Administrator/Desktop/92个诊疗方案及临床路径/";     File file = new File(filePath);     File[] files = file.listFiles();     String name = null;     for (File file2 : files) {         Thread.sleep(500);         name = file2.getName().substring(0, file2.getName().lastIndexOf("."));         System.out.println(file2.getName());         if (file2.getName().endsWith(".docx") || file2.getName().endsWith(".DOCX")) {             CaseHtm.docx(filePath ,file2.getName(),name +".htm");         }else{             CaseHtm.dox(filePath ,file2.getName(),name +".htm");         }          } } /** * 转换docx * @param filePath * @param fileName * @param htmlName * @throws Exception */ public static void docx(String filePath ,String fileName,String htmlName) throws Exception{     final String file = filePath + fileName;     File f = new File(file);       // ) 加载word文档生成 XWPFDocument对象     InputStream in = new FileInputStream(f);     XWPFDocument document = new XWPFDocument(in);     // ) 解析 XHTML配置 (这里设置IURIResolver来设置图片存放的目录)     File imageFolderFile = new File(filePath);     XHTMLOptions options = XHTMLOptions.create().URIResolver(new FileURIResolver(imageFolderFile));     options.setExtractor(new FileImageExtractor(imageFolderFile));     options.setIgnoreStylesIfUnused(false);     options.setFragment(true);     // ) 将 XWPFDocument转换成XHTML     OutputStream out = new FileOutputStream(new File(filePath + htmlName));     XHTMLConverter.getInstance().convert(document, out, options); } /** * 转换doc * @param filePath * @param fileName * @param htmlName * @throws Exception */ public static void dox(String filePath ,String fileName,String htmlName) throws Exception{     final String file = filePath + fileName;     InputStream input = new FileInputStream(new File(file));     HWPFDocument wordDocument = new HWPFDocument(input);     WordToHtmlConverter wordToHtmlConverter = new WordToHtmlConverter(DocumentBuilderFactory.newInstance().newDocumentBuilder().newDocument());     //解析word文档     wordToHtmlConverter.processDocument(wordDocument);     Document htmlDocument = wordToHtmlConverter.getDocument();          File htmlFile = new File(filePath + htmlName);     OutputStream outStream = new FileOutputStream(htmlFile);          DOMSource domSource = new DOMSource(htmlDocument);     StreamResult streamResult = new StreamResult(outStream);          TransformerFactory factory = TransformerFactory.newInstance();     Transformer serializer = factory.newTransformer();     serializer.setOutputProperty(OutputKeys.ENCODING, "utf-8");     serializer.setOutputProperty(OutputKeys.INDENT, "yes");     serializer.setOutputProperty(OutputKeys.METHOD, "html");          serializer.transform(domSource, streamResult);     outStream.close(); }

pom.xml配置:

<dependency>     <groupId>fr.opensagres.xdocreport</groupId>     <artifactId>fr.opensagres.xdocreport.document</artifactId>     <version>1.0.5</version> </dependency> <dependency>       <groupId>fr.opensagres.xdocreport</groupId>       <artifactId>org.apache.poi.xwpf.converter.xhtml</artifactId>       <version>1.0.5</version>   </dependency>     <dependency>     <groupId>org.apache.poi</groupId>     <artifactId>poi</artifactId>     <version>3.12</version> </dependency> <dependency>     <groupId>org.apache.poi</groupId>     <artifactId>poi-scratchpad</artifactId>     <version>3.12</version> </dependency>

以上就是java将word转换为html(代码)的详细内容,更多内容请关注技术你好其它相关文章!

来源链接:
免责声明:
1.资讯内容不构成投资建议,投资者应独立决策并自行承担风险
2.本文版权归属原作所有,仅代表作者本人观点,不代表本站的观点或立场
标签: java
上一篇:php获取远程图片并下载保存到本地的方法分析 下一篇:Java基础:多态的理解与应用

相关资讯