您的位置:首页 > Web前端 > HTML

利用jodconverter(基于OpenOffice服务)将word文件(*.doc)转化为html格式

2011-07-05 09:39 447 查看
package com.syni.im800.kb.common.util;

import java.io.File;
import java.io.FileOutputStream;
import java.io.IOException;
import java.io.InputStream;
import java.io.OutputStream;
import java.net.ConnectException;
import java.text.SimpleDateFormat;
import java.util.Date;

import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;

import com.artofsolving.jodconverter.DocumentConverter;
import com.artofsolving.jodconverter.openoffice.connection.OpenOfficeConnection;
import com.artofsolving.jodconverter.openoffice.connection.SocketOpenOfficeConnection;
import com.artofsolving.jodconverter.openoffice.converter.OpenOfficeDocumentConverter;
import com.syni.im800.kb.config.AppConfig;

/**
* 利用jodconverter(基于OpenOffice服务)将word文件(*.doc)转化为html格式,
* 使用前请检查OpenOffice服务是否已经开启,
* OpenOffice进程名称:soffice.exe | soffice.bin
* @author linshutao
* */
public class Doc2HtmlUtil {

Log log = LogFactory.getLog(getClass());
private static Doc2HtmlUtil doc2HtmlUtil;

/**
* 获取Doc2HtmlUtil实例
* */
public static synchronized Doc2HtmlUtil getDoc2HtmlUtilInstance(){
if(doc2HtmlUtil == null){
doc2HtmlUtil = new Doc2HtmlUtil();
}
return doc2HtmlUtil;
}
/**
* 转换文件
* @param fromFileInputStream:
* */
public String doc2Html(InputStream fromFileInputStream, File toFileFolder){
String soffice_host = AppConfig.getProperty(AppConfig.SOFFICE_HOST_KEY);
String soffice_port = AppConfig.getProperty(AppConfig.SOFFICE_PORT_KEY);
log.debug("soffice_host:"+soffice_host+",soffice_port:"+soffice_port);

Date date = new Date();
SimpleDateFormat sdf =new SimpleDateFormat("yyyyMMddHHmmss");
String timesuffix = sdf.format(date);
String htmFileName = "htmlfile"+timesuffix+".html";
String docFileName = "docfile"+timesuffix+".doc";

File htmlOutputFile = new File(toFileFolder.toString()+File.separatorChar+htmFileName);
File docInputFile = new File(toFileFolder.toString()+File.separatorChar+docFileName);
log.debug("########htmlOutputFile:"+toFileFolder.toString()+File.pathSeparator+htmFileName);
/**
* 由fromFileInputStream构建输入文件
* */
try {
OutputStream os = new FileOutputStream(docInputFile);
int bytesRead = 0;
byte[] buffer = new byte[1024 * 8];
while ((bytesRead = fromFileInputStream.read(buffer)) != -1) {
os.write(buffer, 0, bytesRead);
}

os.close();
fromFileInputStream.close();
} catch (IOException e) {
log.error(e.getMessage(), e);
}

OpenOfficeConnection connection = new SocketOpenOfficeConnection(soffice_host,Integer.parseInt(soffice_port));
try {
connection.connect();
} catch (ConnectException e) {
System.err.println("文件转换出错,请检查OpenOffice服务是否启动。");
log.error(e.getMessage(), e);
}
// convert
DocumentConverter converter = new OpenOfficeDocumentConverter(connection);
converter.convert(docInputFile, htmlOutputFile);
connection.disconnect();
/*		File  htmlOutputFile_rn = new File
(htmlOutputFile.getAbsolutePath().substring(0,htmlOutputFile.getAbsolutePath().lastIndexOf("."))+".htm");
htmlOutputFile.renameTo(htmlOutputFile_rn);
return htmlOutputFile_rn.getName();*/

//转换完之后删除word文件
docInputFile.delete();
log.debug("删除上传文件:"+docInputFile.getName());
return htmFileName;
}

}
内容来自用户分享和网络整理,不保证内容的准确性,如有侵权内容,可联系管理员处理 点击这里给我发消息
标签: 
相关文章推荐