poi将word2007转换成html

作者: 烟雾袅绕 | 来源:发表于2016-07-20 11:23 被阅读1246次

    1:导入jar包依赖

           <dependency>
               <groupId>org.apache.poi</groupId>
               <artifactId>poi-scratchpad</artifactId>
               <version>3.10.1</version>
           </dependency>
          <dependency>
               <groupId>org.apache.xmlbeans</groupId>
               <artifactId>xmlbeans</artifactId>
               <version>2.6.0</version>
          </dependency>
          <dependency>
               <groupId>fr.opensagres.xdocreport</groupId>
               <artifactId>org.apache.poi.xwpf.converter.core</artifactId>
               <version>1.0.6</version>
          </dependency>
          <dependency>
               <groupId>fr.opensagres.xdocreport</groupId>
               <artifactId>org.apache.poi.xwpf.converter.xhtml</artifactId>
               <version>1.0.6</version>
           </dependency>       
    

    2:创建工具类,便于后面直接调用即可

    import java.io.File;
    import java.io.FileInputStream;
    import java.io.FileOutputStream;
    import java.io.IOException;
    import java.io.InputStream;
    import java.io.OutputStream;
    
    import org.apache.poi.xwpf.converter.core.FileImageExtractor;
    import org.apache.poi.xwpf.converter.core.FileURIResolver;
    import org.apache.poi.xwpf.converter.xhtml.XHTMLConverter;
    import org.apache.poi.xwpf.converter.xhtml.XHTMLOptions;
    import org.apache.poi.xwpf.usermodel.XWPFDocument;
    
    /**
     * Utility for converting a Word 2007+ ({@code .docx}) document into an XHTML
     * file, using Apache POI's {@link XWPFDocument} and the xdocreport
     * {@link XHTMLConverter}.
     */
    public class WordtoHtml07 {

        /** File extension of the OOXML word-processing documents this tool accepts. */
        private static final String DOCX_EXTENSION = ".docx";

        /**
         * Converts the given {@code .docx} file to XHTML.
         *
         * <p>If the source file does not exist, or its name does not end with
         * {@code .docx} (compared case-insensitively), a message is printed to
         * standard output and nothing is written.
         *
         * @param fileName  path of the source {@code .docx} document
         * @param imageFile directory passed to the image extractor and URI resolver,
         *                  i.e. where embedded images are written and referenced from
         * @param htmFile   path of the XHTML file to create
         * @throws IOException if reading the document or writing the output fails
         */
        public static void word07ToHtml(String fileName, String imageFile, String htmFile) throws IOException {
            File source = new File(fileName);
            if (!source.exists()) {
                System.out.println("sorry file does not exists");
                return;
            }
            // Binary ".doc" files are rejected here: XWPFDocument only reads the
            // OOXML format, so letting them through would just fail inside POI.
            if (!isDocx(source.getName())) {
                System.out.println("Enter only MS Office 2007+ files");
                return;
            }

            // try-with-resources guarantees both streams are closed, even when
            // loading or converting throws.
            try (InputStream in = new FileInputStream(source)) {
                // 1: load the document into an XWPFDocument
                XWPFDocument document = new XWPFDocument(in);

                // 2: extract embedded images into the given folder and resolve
                //    image URIs against that same folder
                File imageDir = new File(imageFile);
                XHTMLOptions options = XHTMLOptions.create().URIResolver(new FileURIResolver(imageDir));
                options.setExtractor(new FileImageExtractor(imageDir));

                // 3: convert the XWPFDocument to XHTML
                try (OutputStream out = new FileOutputStream(new File(htmFile))) {
                    XHTMLConverter.getInstance().convert(document, out, options);
                }
            }
        }

        /** Returns whether {@code name} ends with ".docx", ignoring case. */
        private static boolean isDocx(String name) {
            int extensionLength = DOCX_EXTENSION.length();
            // regionMatches returns false for a negative offset, so names shorter
            // than the extension are handled without an explicit length check.
            return name.regionMatches(true, name.length() - extensionLength, DOCX_EXTENSION, 0, extensionLength);
        }

        /**
         * Sample invocation with hard-coded paths.
         *
         * @param args ignored
         */
        public static void main(String args[]) {
            try {
                // The sample input must be a .docx file; a binary .doc is not
                // a Word 2007+ document and is rejected by word07ToHtml.
                word07ToHtml("F:/51/1.docx", "F:/51/media", "F:/51/1.htm");
            } catch (IOException e) {
                e.printStackTrace();
            }
        }
    }
    

    附:以上简单地实现了 Word 转换成 HTML,欢迎各路大神补充在项目中遇到的其他需求,完善工具类的封装,谢谢。

    相关文章

      网友评论

      • wolfies:代码能用,就是图片是绝对路径。
      • SmNiuhe:异常了:java.lang.NoSuchMethodError: org.apache.poi.POIXMLDocumentPart.getPackageRelationship()Lorg/apache/poi/openxml4j/opc/PackageRelationship; 是最新jar的原因吗?

      本文标题:poi将word2007转换成html

      本文链接:https://www.haomeiwen.com/subject/qosvjttx.html