Java实现将Word转换为HTML的方法示例【doc与docx格式】

本文实例讲述了Java实现将Word转换为HTML的方法。分享给大家供大家参考，具体如下：

								
									 public   static   void   main(string[] args)   throws   exception { 

									 string filepath =   "c:/users/administrator/desktop/92个诊疗方案及临床路径/"  ; 

									 file file =   new   file(filepath); 

									 file[] files = file.listfiles(); 

									 string name =   null  ; 

									 for   (file file2 : files) { 

									    thread.sleep(  500  ); 

									    name = file2.getname().substring(  0  , file2.getname().lastindexof(  "."  )); 

									    system.out.println(file2.getname()); 

									    if   (file2.getname().endswith(  ".docx"  ) || file2.getname().endswith(  ".docx"  )) { 

									    casehtm.docx(filepath ,file2.getname(),name +  ".htm"  ); 

									    }  else  { 

									    casehtm.dox(filepath ,file2.getname(),name +  ".htm"  ); 

									    } 

									      } 

									 } 

									 /**
									  * Converts a {@code .docx} document to an XHTML fragment.
									  *
									  * <p>Source and target paths are formed by concatenating {@code filepath}
									  * with the file names, so {@code filepath} must end with a path separator.
									  * {@code filepath} is also passed to the image extractor and URI resolver
									  * as the image folder.
									  *
									  * @param filepath directory containing the document, ending with a path separator
									  * @param filename name of the {@code .docx} file inside {@code filepath}
									  * @param htmlname name of the HTML file to create inside {@code filepath}
									  * @throws Exception if the document cannot be read, converted or written
									  */
									 public static void docx(String filepath, String filename, String htmlname) throws Exception {
									     // 1) Load the Word document into an XWPFDocument.
									     //    The stream is closed as soon as the document object has been built.
									     XWPFDocument document;
									     try (InputStream in = new FileInputStream(new File(filepath + filename))) {
									         document = new XWPFDocument(in);
									     }
									     // 2) Configure the XHTML conversion (the URI resolver and extractor set the image directory).
									     File imageFolderFile = new File(filepath);
									     XHTMLOptions options = XHTMLOptions.create().URIResolver(new FileURIResolver(imageFolderFile));
									     options.setExtractor(new FileImageExtractor(imageFolderFile));
									     options.setIgnoreStylesIfUnused(false);
									     options.setFragment(true);
									     // 3) Convert the XWPFDocument to XHTML.
									     //    try-with-resources flushes and closes the output file even if conversion fails.
									     try (OutputStream out = new FileOutputStream(new File(filepath + htmlname))) {
									         XHTMLConverter.getInstance().convert(document, out, options);
									     }
									 }

									 /** 

									 * 转换doc 

									 * @param filepath 

									 * @param filename 

									 * @param htmlname 

									 * @throws exception 

									 */ 

									 public   static   void   dox(string filepath ,string filename,string htmlname)   throws   exception{ 

									      final   string file = filepath + filename; 

									      inputstream input =   new   fileinputstream(  new   file(file)); 

									      hwpfdocument worddocument =   new   hwpfdocument(input); 

									      wordtohtmlconverter wordtohtmlconverter =   new   wordtohtmlconverter(documentbuilderfactory.newinstance().newdocumentbuilder().newdocument()); 

									      //解析word文档 

									      wordtohtmlconverter.processdocument(worddocument); 

									      document htmldocument = wordtohtmlconverter.getdocument(); 

									      file htmlfile =   new   file(filepath + htmlname); 

									      outputstream outstream =   new   fileoutputstream(htmlfile); 

									      domsource domsource =   new   domsource(htmldocument); 

									      streamresult streamresult =   new   streamresult(outstream); 

									      transformerfactory factory = transformerfactory.newinstance(); 

									      transformer serializer = factory.newtransformer(); 

									      serializer.setoutputproperty(outputkeys.encoding,   "utf-8"  ); 

									      serializer.setoutputproperty(outputkeys.indent,   "yes"  ); 

									      serializer.setoutputproperty(outputkeys.method,   "html"  ); 

									      serializer.transform(domsource, streamresult); 

									      outstream.close(); 

									    }

								
									 <!-- Maven dependencies for the converter code. Element names are case-sensitive: groupId / artifactId. -->
									 <dependency>
									     <groupId>fr.opensagres.xdocreport</groupId>
									     <artifactId>fr.opensagres.xdocreport.document</artifactId>
									     <version>1.0.5</version>
									 </dependency>
									 <!-- XWPF-to-XHTML converter used for .docx files -->
									 <dependency>
									     <groupId>fr.opensagres.xdocreport</groupId>
									     <artifactId>org.apache.poi.xwpf.converter.xhtml</artifactId>
									     <version>1.0.5</version>
									 </dependency>
									 <dependency>
									     <groupId>org.apache.poi</groupId>
									     <artifactId>poi</artifactId>
									     <version>3.12</version>
									 </dependency>
									 <!-- HWPF (binary .doc) support used for .doc files -->
									 <dependency>
									     <groupId>org.apache.poi</groupId>
									     <artifactId>poi-scratchpad</artifactId>
									     <version>3.12</version>
									 </dependency>

希望本文所述对大家Java程序设计有所帮助。

原文链接：https://blog.csdn.net/tangyaliang11/article/details/79007873

声明：本文来自网络，不代表【好得很程序员自学网】立场，转载请注明出处：http://www.haodehen.cn/did236113

更新时间：2023-05-23 阅读：37次