使用libreOffice(jodconverter)将office(ppt,Excel,word,text)文档转换成pdf

  • 使用libreOffice比使用OpenOffice转换稳定,libreOffice是OpenOffice的升级版本,但也不能完全盖晗OpenOffice,下面代码注释的部分即为OpenOffice将文档转换成PDF,使用libreOffice/OpenOffice都必须安装对应系统的libreOffice/OpenOffice软件。
package com.frank.demo.file.common.util;



import java.io.ByteArrayOutputStream;
import java.io.File;
import java.io.FileInputStream;
import java.io.FileNotFoundException;
import java.io.FileOutputStream;
import java.io.IOException;
import java.io.InputStream;
import java.util.UUID;


import org.artofsolving.jodconverter.OfficeDocumentConverter;
import org.artofsolving.jodconverter.office.DefaultOfficeManagerConfiguration;
import org.artofsolving.jodconverter.office.ExternalOfficeManagerConfiguration;
import org.artofsolving.jodconverter.office.OfficeManager;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.springframework.beans.factory.annotation.Autowired;
import org.springframework.data.mongodb.core.query.Criteria;
import org.springframework.data.mongodb.core.query.Query;
import org.springframework.data.mongodb.gridfs.GridFsTemplate;
import org.springframework.stereotype.Component;


import com.lowagie.text.Document;
import com.lowagie.text.Image;
import com.lowagie.text.Rectangle;
import com.lowagie.text.pdf.PdfWriter;
import com.mongodb.gridfs.GridFSDBFile;

@Component
public class FlieToPdfUtilTwo {

	@Autowired
	private GridFsTemplate fileRepository;

	// private static String openOfficePath = "C:\\Program Files
	// (x86)\\OpenOffice 4"; 
	// openoffice软件的安装默认路径
	private static String libreOfficePath = "C:\\Program Files\\LibreOffice 5";
	// libreOffice软件的安装默认路径
	// 记录日志信息
	private static Logger logger = LoggerFactory.getLogger(FlieToPdfUtilTwo.class);

public ByteArrayOutputStream fileToPdf(String fileId) throws Exception {
	GridFSDBFile gridFSDBFile = fileRepository.findOne(new Query(Criteria.where("_id").is(fileId)));
	if (null != gridFSDBFile) {
		String type = this.getFileSufix(gridFSDBFile.getFilename());
		String folder = System.getProperty("java.io.tmpdir");
		String docs[] = { "doc", "docx", "ppt", "pptx", "xls", "xlsx", "txt" };
		String imgs[] = { "jpg", "png", "jpeg", "gif" };
		if (this.isExsitArry(type, imgs)) {
			StringBuffer filePath = new StringBuffer();
			String name = this.generateToken();
			filePath.append(folder);
			filePath.append(name);
			filePath.append("." + type);
			this.readFile(gridFSDBFile, filePath.toString());
			StringBuffer pdfPath = new StringBuffer();
			pdfPath.append(folder);
			pdfPath.append(name);
			pdfPath.append(".pdf");
			this.imgToPDF(filePath.toString(), pdfPath.toString());
			return this.getBytes(pdfPath.toString());
		} else if (this.isExsitArry(type, docs)) {
			StringBuffer filePath = new StringBuffer();
			String name = this.generateToken();
			filePath.append(folder);
			filePath.append(name);
			filePath.append("." + type);
			this.readFile(gridFSDBFile, filePath.toString());
			StringBuffer pdfPath = new StringBuffer();
			pdfPath.append(folder);
			pdfPath.append(name);
			pdfPath.append(".pdf");
			this.libreOfficeToPDF(filePath.toString(), pdfPath.toString());
			return this.getBytes(pdfPath.toString());
		} else {
			InputStream is = gridFSDBFile.getInputStream();
			ByteArrayOutputStream baos = new ByteArrayOutputStream();
			byte[] buffer = new byte[1024];
			int len;
			while ((len = is.read(buffer)) > -1) {
				baos.write(buffer, 0, len);
			}
			is.close();
			baos.flush();
			return baos;
		}
	} else {
		throw new Exception("文件不存在!");
	}
}

/**
* 检测元素是否存在数组中 不区分大小写
* 
* @param chex
* @param arry
* @return 存在 true 不存在 false
*/
public boolean isExsitArry(String chex, String arry[]) {
	for (String ex : arry) {
		if (chex.equalsIgnoreCase(ex)) {
			return true;
		}
	}
	return false;
}

/**
* 删除单个文件
* 
* @param sPath
*            被删除文件的文件名
* @return 单个文件删除成功返回true,否则返回false
*/
public boolean deleteFile(String sPath) {
	boolean flag = false;
	File file = new File(sPath);
	// 路径为文件且不为空则进行删除
	if (file.isFile() && file.exists()) {
		file.delete();
		flag = true;
	}
	return flag;
}

/**
* 写入当前文件
*/
public void readFile(GridFSDBFile gridFSDBFile, String filePath) throws Exception {
	InputStream is = gridFSDBFile.getInputStream();
	FileOutputStream os = new FileOutputStream(filePath);
	int index = 0;
	while ((index = is.read()) != -1) {
		os.write(index);
	}
	is.close();
	os.close();
}

/**
* 获取pdf文件输出流
*/
public ByteArrayOutputStream getBytes(String filePath) {
	File file = new File(filePath);
	ByteArrayOutputStream out = null;
	try {
		FileInputStream in = new FileInputStream(file);
		out = new ByteArrayOutputStream();
		byte[] b = new byte[1024];
		while ((in.read(b)) != -1) {
			out.write(b, 0, b.length);
		}
		out.close();
		in.close();
	} catch (FileNotFoundException e) {
		e.printStackTrace();
	} catch (IOException e) {
		e.printStackTrace();
	}
	this.deleteFile(filePath.toString());
	return out;
}

/**
* 获取随机名称
*/
public String generateToken() throws Exception {
	return UUID.randomUUID().toString().replace("-", "");
}

/***
* 判断文件类型
* 
* @param fileName
* @return
*/
public String getFileSufix(String fileName) {
	int splitIndex = fileName.lastIndexOf(".");
	return fileName.substring(splitIndex + 1);
}

/**
* office转PDF
*/
/*
* private void officeToPDF(String inputFiles, String pdfFile) {
* 		OpenOfficeConnection connection = new
* SocketOpenOfficeConnection("127.0.0.1", 8100); Process pro = null;
* 		BufferedReader br = null; try { File inputFile = new File(inputFiles);
*  		// 如果目标路径不存在, 则新建该路径 
* 		File outputFile = new File(pdfFile); 
* 		if (!outputFile.getParentFile().exists()) {
* 			outputFile.getParentFile().mkdirs(); 
* 		} 
* 		String OpenOffice_HOME = openOfficePath;
* 		// 这里是OpenOffice的安装目录 
*		 // 如果从文件中读取的URL地址最后一个字符不是 '\',则添加'\'
* 		if (OpenOffice_HOME.charAt(OpenOffice_HOME.length() - 1) != '\\') {
* 			OpenOffice_HOME += "\\"; 
*		} 
* 		// 启动OpenOffice的服务 
*		String command=OpenOffice_HOME+"program/soffice.exe -headless accept=\"socket,host=127.0.0.1,port=8100;urp;\" -nofirststartwizard"; 
* 		boolean flag = false; 
* 		// 取出所有的进程 
* 		Process proc = Runtime.getRuntime().exec("tasklist"); 
* 		br = new BufferedReader(new
* 		InputStreamReader(proc.getInputStream())); 
* 		String line; 
* 		while ((line = br.readLine()) != null) {
*  			if (line.indexOf("soffice.exe") != -1) { 
*				 flag = true;
* 			} 
* 		} 
* 		pro = Runtime.getRuntime().exec(command); 
* 		// 判断如果存在进程就不启进程 
*		 if(!flag) { 
*			connection.connect(); 
*		} 
* 		// convert 
* 		DocumentConverter converter  = new OpenOfficeDocumentConverter(connection);
*		converter.convert(inputFile, outputFile); 
* 		} catch (ConnectException e) {
*			logger.info(e.getMessage());
*  			e.printStackTrace(); 
* 		} catch (IOException e)  {
*  			logger.info(e.getMessage());
*  			// TODO Auto-generated catch block
* 			e.printStackTrace(); 
* 		} catch (Exception e) { 
* 			logger.info(e.getMessage());
* 			e.printStackTrace();
*  		} finally {
*  			if (br != null) {
*  				try { 
* 					br.close(); 
* 				}catch (Exception e) { 
* 					e.printStackTrace();
*  				} 
* 			} 
* 			// close the connection
* 			connection.disconnect(); 
*			 // 关闭OpenOffice服务的进程 
* 			pro.destroy(); 
* 		} 
* }
*/

/**
* 利用libreOffice将office doc文档转换成pdf
*/
private void libreOfficeToPDF(String inputFile, String pdfFile) {
	// 先启动已存在的LibreOffice服务
	OfficeManager officeManager = null;
	officeManager = this.startExsitLibreOffice(officeManager);
	try {
		OfficeDocumentConverter converter = new OfficeDocumentConverter(officeManager);
		File inputFiles = new File(inputFile);
		File outputFile = new File(pdfFile);
		converter.convert(inputFiles, outputFile);
	} catch (Exception e) {
		e.printStackTrace();
		logger.info("libreOfficeToPDF异常:" + e.getMessage());
	}
}

private OfficeManager startExsitLibreOffice(OfficeManager officeManager) {
	logger.info("准备启动服务....");
	try {
		logger.info("尝试连接已启动的服务...");
		ExternalOfficeManagerConfiguration externalProcessOfficeManager = new 			  		ExternalOfficeManagerConfiguration();
		externalProcessOfficeManager.setConnectOnStart(true);
		externalProcessOfficeManager.setPortNumber(8200);
		officeManager = externalProcessOfficeManager.buildOfficeManager();
		officeManager.start();
		logger.info("office转换服务启动成功!");
	} catch (Exception ex) {
		logger.info("没有已启动的服务..." + ex.getMessage());
		try {
			logger.info("正在启动office转换服务……");
			DefaultOfficeManagerConfiguration configuration = new 		DefaultOfficeManagerConfiguration();
			// libreOffice的安装目录
			configuration.setOfficeHome(new File(libreOfficePath));
			// configuration.setOfficeHome(libreOfficePath);
			// 端口号
			configuration.setMaxTasksPerProcess(100);
			configuration.setPortNumber(8200);
			configuration.setTaskExecutionTimeout(1000 * 60 * 5L);
			configuration.setTaskQueueTimeout(1000 * 60 * 60 * 24L);
			officeManager = configuration.buildOfficeManager();
			officeManager.start();
			logger.info("office转换服务启动成功!");
			} catch (Exception e) {
				logger.info("LibreOffice服务启动异常:" + e.getMessage());
			}
	}
	return officeManager;
}

private void imgToPDF(String imgFilePath, String pdfFilePath) {
	File file = new File(imgFilePath);
	if (file.exists()) {
		Document document = null;
		FileOutputStream fos = null;
		try {
			// 读取一个图片
			Image image = Image.getInstance(imgFilePath);
			float imageHeight = image.getScaledHeight();
			float imageWidth = image.getScaledWidth();
			int i = 0;
			while (imageHeight > 500 || imageWidth > 500) {
				image.scalePercent(100 - i);
				i++;
				imageHeight = image.getScaledHeight();
				imageWidth = image.getScaledWidth();
			}
			image.setAlignment(Image.ALIGN_CENTER);
			// 文档页面宽高为图片宽高
			Rectangle rect = new Rectangle(imageWidth, imageHeight);
			document = new Document(rect);
			// 读取文件流,创建可读写的文件
			fos = new FileOutputStream(pdfFilePath);
			PdfWriter.getInstance(document, fos);
			// 设置文档边距
			document.setMargins(0, 0, 0, 0);
			// 打开文档
			document.open();
			// 插入一个图片
			document.add(image);
		} catch (Exception e) {
			e.printStackTrace();
		} 
		document.close();
		try {
			fos.flush();
			fos.close();
		} catch (IOException e) {
			e.printStackTrace();
		}
	}
}

}

你可能感兴趣的:(Java)