首页 > 开发 > Java > 正文

Java实现将word转换为html的方法示例【doc与docx格式】

2019-10-21 18:22:45
字体:
来源:转载
供稿:网友

本文实例讲述了html">Java实现将word转换为html的方法。分享给大家供大家参考,具体如下:

 public static void main(String[] args) throws Exception { String filePath = "C:/Users/Administrator/Desktop/92个诊疗方案及临床路径/"; File file = new File(filePath); File[] files = file.listFiles(); String name = null; for (File file2 : files) {  Thread.sleep(500);  name = file2.getName().substring(0, file2.getName().lastIndexOf("."));  System.out.println(file2.getName());  if (file2.getName().endsWith(".docx") || file2.getName().endsWith(".DOCX")) {  CaseHtm.docx(filePath ,file2.getName(),name +".htm");  }else{  CaseHtm.dox(filePath ,file2.getName(),name +".htm");  }      } } /** * 转换docx * @param filePath * @param fileName * @param htmlName * @throws Exception */ public static void docx(String filePath ,String fileName,String htmlName) throws Exception{ final String file = filePath + fileName; File f = new File(file);  // ) 加载word文档生成 XWPFDocument对象 InputStream in = new FileInputStream(f); XWPFDocument document = new XWPFDocument(in); // ) 解析 XHTML配置 (这里设置IURIResolver来设置图片存放的目录) File imageFolderFile = new File(filePath); XHTMLOptions options = XHTMLOptions.create().URIResolver(new FileURIResolver(imageFolderFile)); options.setExtractor(new FileImageExtractor(imageFolderFile)); options.setIgnoreStylesIfUnused(false); options.setFragment(true); // ) 将 XWPFDocument转换成XHTML OutputStream out = new FileOutputStream(new File(filePath + htmlName)); XHTMLConverter.getInstance().convert(document, out, options); } /** * 转换doc * @param filePath * @param fileName * @param htmlName * @throws Exception */ public static void dox(String filePath ,String fileName,String htmlName) throws Exception{    final String file = filePath + fileName;    InputStream input = new FileInputStream(new File(file));    HWPFDocument wordDocument = new HWPFDocument(input);    WordToHtmlConverter wordToHtmlConverter = new WordToHtmlConverter(DocumentBuilderFactory.newInstance().newDocumentBuilder().newDocument());    //解析word文档    wordToHtmlConverter.processDocument(wordDocument);    Document htmlDocument = wordToHtmlConverter.getDocument();    File htmlFile = new File(filePath + htmlName);    OutputStream outStream = new FileOutputStream(htmlFile);    DOMSource domSource = new DOMSource(htmlDocument);    StreamResult streamResult = new StreamResult(outStream);    TransformerFactory factory = TransformerFactory.newInstance();    Transformer serializer = factory.newTransformer();    serializer.setOutputProperty(OutputKeys.ENCODING, "utf-8");    serializer.setOutputProperty(OutputKeys.INDENT, "yes");    serializer.setOutputProperty(OutputKeys.METHOD, "html");    serializer.transform(domSource, streamResult);    outStream.close();  }
<dependency>  <groupId>fr.opensagres.xdocreport</groupId>  <artifactId>fr.opensagres.xdocreport.document</artifactId>  <version>1.0.5</version></dependency><dependency>   <groupId>fr.opensagres.xdocreport</groupId>   <artifactId>org.apache.poi.xwpf.converter.xhtml</artifactId>   <version>1.0.5</version> </dependency>  <dependency>  <groupId>org.apache.poi</groupId>  <artifactId>poi</artifactId>  <version>3.12</version></dependency><dependency>  <groupId>org.apache.poi</groupId>  <artifactId>poi-scratchpad</artifactId>  <version>3.12</version></dependency>

 

希望本文所述对大家java程序设计有所帮助。


注:相关教程知识阅读请移步到JAVA教程频道。
发表评论 共有条评论
用户名: 密码:
验证码: 匿名发表