java利用第三方jar实现excel,word,ppt,txt转pdf格式
最近项目有文件模块的上传预览功能,比如把word文档上传,以后点击可以预览。采用的思路为:文件上传到服务器,然后获取转换成对应的新的PDF文件,然后读取PDF文件。本文着重实现文档上传然后转为PDF。所需jar: https://pan.baidu.com/s/1AKBQuD4GPxQsxFomIi-sEQ 提取码: rzju
文件上传代码:
public String fileUpload(HttpServletRequest request, HttpServletResponse response) { String saveDirectory = request.getServletContext().getRealPath("/upload");//上传路径 // 将当前上下文初始化给 CommonsMutipartResolver (多部分解析器) CommonsMultipartResolver multipartResolver = new CommonsMultipartResolver( request.getSession().getServletContext()); if (multipartResolver.isMultipart(request)) { // 将request变成多部分request MultipartHttpServletRequest multiRequest = (MultipartHttpServletRequest) request; // 获取multiRequest 中所有的文件名 Iterator iter = multiRequest.getFileNames(); String extName = "";// 扩展名 while (iter.hasNext()) { // 一次遍历所有文件 MultipartFile file = multiRequest.getFile(iter.next().toString()); if (file != null) { try { InputStream is = file.getInputStream();
//获取文件md5值判断是否有重复,如果有文件就不上传,直接读取 String fileHashCode = MD5Util.md5HashCode32(is); String originalFileName = file.getOriginalFilename();
//获取扩展名 extName = originalFileName.substring(originalFileName.lastIndexOf(".")); //源文件上传地址
String sourceFilePath = saveDirectory + File.separator + fileHashCode + extName;
//生成的目标文件地址 String destinatFilePath = request.getServletContext.getRealPath("/convert")+File.separator+fileHashCode + ".pdf";
// 表示文件已存在不需要上传
if (new File(sourceFilePath).exists()) {
continue;//跳出本次循环 } else { file.transferTo(new File(path));// 生成新的文件 file.getInputStream().close();//流关最好在finally里关闭 // 文件转换工具用于转换文件,最好新开线程,对文件较大的需要等待时间。参数(源文件路径,目标文件路径) FileConvertUtils.convert(sourceFilePath, destinatFilePath); } } catch (Exception e) { // TODO Auto-generated catch block e.printStackTrace(); } } } return "请选择文件上传!"; } return "文件上传请求配置错误!"; }
定义函数用于判断调用哪个转换函数:
public class FileConvertUtils { public static final Logger log = LoggerFactory.getLogger(FileConvertUtils.class); public static void convert(final String sourceFilePath ,final String destFilePath){ String fileType = sourceFilePath.substring(sourceFilePath.lastIndexOf(".")); ExecutorService executor = Executors.newCachedThreadPool() ; executor.submit(() -> { try { //要执行的业务代码, if(!"".equals(fileType)&&fileType!=null){ if(".doc".equals(fileType)||".docx".equals(fileType)||".wps".equals(fileType)){ OfficeToPdfUtils.word2Pdf(sourceFilePath,destFilePath); }else if(".txt".equals(fileType)){ OfficeToPdfUtils.word2Pdf(sourceFilePath,destFilePath); }else if(".xls".equals(fileType)||".xlsx".equals(fileType)){ OfficeToPdfUtils.excel2Pdf(sourceFilePath,destFilePath); }else if(".ppt".equals(fileType)||".pptx".equals(fileType)){ OfficeToPdfUtils.ppt2Pdf(sourceFilePath,destFilePath); }else if(".pdf".equals(fileType)){ FileUtils.copyFile(sourceFilePath, destFilePath); } } }catch(Exception e) { e.printStackTrace(); throw new RuntimeException("报错啦!!"); } }); } }
文件转换核心代码:
package com.hhwy.fileview.convert; import org.slf4j.Logger; import org.slf4j.LoggerFactory; import com.aspose.cells.Workbook; import com.aspose.pdf.SaveFormat; import com.aspose.slides.Presentation; import com.aspose.words.Document; import com.hhwy.fweb.framework.api.utils.IoTools; import java.io.FileInputStream; import java.io.FileOutputStream; import java.io.IOException; import java.io.InputStream; import java.io.*; public class OfficeToPdfUtils { /** * The constant LOG. * */ private static final Logger LOG = LoggerFactory.getLogger(OfficeToPdfUtils.class); /** * 获取license * * @return */ public static boolean getWordLicense() { boolean result = false; try { InputStream license = new FileInputStream(new File(IoTools.getABSPATH() + "WEB-INF/license.xml"));// license路径,这里我引用的是公司的包获取路径,这边自己可以定义指定路径 com.aspose.words.License aposeLic = new com.aspose.words.License(); aposeLic.setLicense(license); result = true; } catch (Exception e) { e.printStackTrace(); } return result; } public static boolean getPPTLicense() { boolean result = false; try { InputStream license = new FileInputStream(new File(IoTools.getABSPATH() + "WEB-INF/license.xml"));// license路径 com.aspose.slides.License aposeLic = new com.aspose.slides.License(); aposeLic.setLicense(license); result = true; } catch (Exception e) { e.printStackTrace(); } return result; } public static boolean getExcelLicense() { boolean result = false; try { InputStream license = new FileInputStream(new File(IoTools.getABSPATH() + "WEB-INF/license.xml"));// license路径 com.aspose.cells.License aposeLic = new com.aspose.cells.License(); aposeLic.setLicense(license); result = true; } catch (Exception e) { e.printStackTrace(); } return result; } public static void word2Pdf(String resourceFilePath, String destFilePath) { InputStream wordIn = null; try { wordIn = new FileInputStream(new File(resourceFilePath)); } catch (FileNotFoundException e) { e.printStackTrace(); } FileOutputStream fileOS = null; // 验证License if (!getWordLicense()) { LOG.error("验证License失败!"); return; } try { Document doc = new Document(wordIn); fileOS = new FileOutputStream(new File(destFilePath)); // 保存转换的pdf文件 doc.save(fileOS, com.aspose.words.SaveFormat.PDF); } catch (Exception e) { LOG.error("error:", e); } finally { try { if(fileOS != null){ fileOS.close(); } } catch (IOException e) { LOG.error("error:", e); } } } public static void ppt2Pdf(String resourceFilePath, String destFilePath){ InputStream wordIn = null; try { wordIn = new FileInputStream(new File(resourceFilePath)); } catch (FileNotFoundException e) { e.printStackTrace(); } FileOutputStream fileOS = null; // 验证License if (!getPPTLicense()) { LOG.error("验证License失败!"); return; } try { fileOS = new FileOutputStream(new File(destFilePath)); Presentation ppt = new Presentation(wordIn);
//此处不可写SaveFormat.Pdf,这样转换能生成文件,但是转换的文件无法打开 ppt.save(fileOS, com.aspose.slides.SaveFormat.Pdf); } catch (Exception e) { LOG.error("error:", e); } finally { try { if(fileOS != null){ fileOS.close(); } } catch (IOException e) { LOG.error("error:", e); } } }
public static void word2Html(String resourceFilePath, String destFilePath) { InputStream wordIn = null; try { wordIn = new FileInputStream(new File(resourceFilePath)); } catch (FileNotFoundException e) { e.printStackTrace(); } FileOutputStream fileOS = null; // 验证License if (!getWordLicense()) { LOG.error("验证License失败!"); return; } try { Document doc = new Document(wordIn); fileOS = new FileOutputStream(new File(destFilePath)); // 保存转换的pdf文件 doc.save(fileOS, com.aspose.words.SaveFormat.HTML); } catch (Exception e) { LOG.error("error:", e); } finally { try { if(fileOS != null){ fileOS.close(); } } catch (IOException e) { LOG.error("error:", e); } } } public static void excel2Pdf(String resourceFilePath, String destFilePath){ InputStream in = null; try { in = new FileInputStream(new File(resourceFilePath)); } catch (FileNotFoundException e) { e.printStackTrace(); } FileOutputStream fileOS = null; // 验证License if (!getExcelLicense()) { LOG.error("验证License失败!"); return; } try { fileOS = new FileOutputStream(new File(destFilePath)); Workbook excel = new Workbook(in); excel.save(destFilePath,com.aspose.cells.SaveFormat.PDF); } catch (Exception e) { LOG.error("error:", e); } finally { try { if(fileOS != null){ fileOS.close(); System.out.println("转换已完成!"); } } catch (IOException e) { LOG.error("error:", e); } } }
public static void main(String[] args) { word2Pdf("/Users/workspace/docs/test.docx","/Users/workspace/docs/test.pdf"); /* InputStream pptIn = new FileInputStream(new File("/Users/workspace/docs/test.pptx")); ppt2Pdf(pptIn,"/Users/workspace/docs/test-ppt.pdf"); InputStream excelIn = new FileInputStream(new File("/Users/workspace/docs/test.xlsx")); excel2Pdf(excelIn,"D:\\aspose\\test-excel.pdf"); InputStream txtIn = new FileInputStream(new File("/Users/workspace/docs/test.txt")); word2Pdf(txtIn,"/Users/workspace/docs/test-txt.pdf");*/ } }
本在实现上还有许多需要优化的地方,比如如何得知某文件何时转换成功,文件夹,文件不存在时候的判断等。后续优化后再更新。
针对无法获取文件何时转换成功,修改了FileConvertUtils 使其实现Callable接口,定义线程池在上传文件外部调用该类,代码:
public class FileConvertUtils implements Callable<Integer>{ private String sourceFilePath; private String destFilePath; FileConvertUtils(String sourceFilePath,String destFilePath){ this.sourceFilePath = sourceFilePath; this.destFilePath = destFilePath; } public void convert(String sourceFilePath,String destFilePath){ String fileType = sourceFilePath.substring(sourceFilePath.lastIndexOf(".")); try { //要执行的业务代码, if(!"".equals(fileType)&&fileType!=null){ if(".doc".equals(fileType)||".docx".equals(fileType)||".wps".equals(fileType)){ OfficeToPdfUtils.word2Pdf(sourceFilePath,destFilePath); }else if(".txt".equals(fileType)){ OfficeToPdfUtils.word2Pdf(sourceFilePath,destFilePath); }else if(".xls".equals(fileType)||".xlsx".equals(fileType)){ OfficeToPdfUtils.excel2Pdf(sourceFilePath,destFilePath); }else if(".ppt".equals(fileType)||".pptx".equals(fileType)){ OfficeToPdfUtils.ppt2Pdf(sourceFilePath,destFilePath); }else if(".pdf".equals(fileType)){ FileUtils.copyFile(sourceFilePath, destFilePath); } } }catch(Exception e) { e.printStackTrace(); throw new RuntimeException("报错啦!!"); } } @Override public Integer call() throws Exception { this.convert(sourceFilePath, destFilePath); return 1;//通过future.get可以获取改返回值,表示执行完成 }
调用处代码:
ExecutorService executor = Executors.newCachedThreadPool(); Future<Integer> future = executor.submit(new FileConvertUtils(sourceFilePath,destinatFilePath)); System.out.println("=================="+future.get());//如果返回1,则调用成功,否则get方法会一直阻塞。
增加ppt转图片操作方法:
/** * pptToImage * @param resourceFilePath * @param destFilePath */ public static void ppt2Image(String resourceFilePath,String destFilePath){ InputStream wordIn = null; try { wordIn = new FileInputStream(new File(resourceFilePath)); } catch (Exception e) { e.printStackTrace(); } FileOutputStream fileOS = null; //验证license if(!getPPTLicense()){ LOG.error("验证License失败!"); return; } try { Presentation ppt = new Presentation(wordIn); int i=0; for(;i<ppt.getSlides().size();i++){ ISlide slide = ppt.getSlides().get_Item(i); int hight = (int) (ppt.getSlideSize().getSize().getHeight()-150); int width = (int) (ppt.getSlideSize().getSize().getWidth()-150); BufferedImage image = slide.getThumbnail(new Dimension(width,hight)); //每页输出一张图片 File outImage = new File(destFilePath.replace(".pdf","")+i+".JPG"); ImageIO.write(image, "JPG", outImage); } } catch (Exception e) { e.printStackTrace(); } }