您的位置:首页 > Web前端 > HTML

C#实现将PPT转换成HTML的方法

2014-08-07 10:57 1001 查看

本文是一个C#的小程序,主要实现将ppt转换成html的功能,方法很多,此处与大家分享一下,希望能对大家的项目开发起到一定的借鉴作用。

主要功能代码如下:

using System;
using System.Collections.Generic;
using System.Text;
using System.IO;
using PPT = Microsoft.Office.Interop.PowerPoint;
using System.Reflection;
namespace WritePptDemo
{
class Program
{
static void Main(string[] args)
{
string  path;     //文件路径变量
PPT.Application pptApp;   //Excel应用程序变量
PPT.Presentation pptDoc;   //Excel文档变量
PPT.Presentation pptDoctmp;
path  = @"C:\MyPPT.ppt";   //路径
pptApp =  new PPT.ApplicationClass();  //初始化
//如果已存在,则删除
if  (File.Exists((string)path))
{
File.Delete((string)path);
}
//由于使用的是COM库,因此有许多变量需要用Nothing代替
Object  Nothing = Missing.Value;
pptDoc =  pptApp.Presentations.Add(Microsoft.Office.Core.MsoTriState.msoFalse);
pptDoc.Slides.Add(1,  Microsoft.Office.Interop.PowerPoint.PpSlideLayout.ppLayoutText);
string text = "示例文本";
foreach  (PPT.Slide slide in pptDoc.Slides)
{
foreach (PPT.Shape shape in slide.Shapes)
{
shape.TextFrame.TextRange.InsertAfter(text);
}
}
//WdSaveFormat为Excel文档的保存格式
PPT.PpSaveAsFileType format = PPT.PpSaveAsFileType.ppSaveAsDefault;
//将excelDoc文档对象的内容保存为XLSX文档
pptDoc.SaveAs(path, format, Microsoft.Office.Core.MsoTriState.msoFalse);
//关闭excelDoc文档对象
pptDoc.Close();
//关闭excelApp组件对象
pptApp.Quit();
Console.WriteLine(path + " 创建完毕!");
Console.ReadLine();
string  pathHtml = @"c:\MyPPT.html";
PPT.Application pa = new PPT.ApplicationClass();
pptDoctmp = pa.Presentations.Open(path,  Microsoft.Office.Core.MsoTriState.msoTrue,  Microsoft.Office.Core.MsoTriState.msoFalse,  Microsoft.Office.Core.MsoTriState.msoFalse);
PPT.PpSaveAsFileType formatTmp = PPT.PpSaveAsFileType.ppSaveAsHTML;
pptDoctmp.SaveAs(pathHtml, formatTmp,  Microsoft.Office.Core.MsoTriState.msoFalse);
pptDoctmp.Close();
pa.Quit();
Console.WriteLine(pathHtml + " 创建完毕!");
}
}
}

以上程序是使用C# 先创建一个ppt 文件并向里面写入了文字,然后再把此ppt 转换成html  ,对于上面程序需要说明的其实就是

引用dll的问题, 在项目中添加引用,在com 组件中选择 microsoft powerpoint 11.0 object   library ,而如果你的电脑没有安装 office 2003 是不会有这个的,而如果安装的是office 2007 则是microsoft powerpoint 12.0 object   library。而且即使你引用成功后,还是会编译不通过,是因为少安装了 office   PIA  ,在安装office 时,如果你是选择的典型安装是不会安装这个的,因为这个只针对开发人员才会用到。可以到网上下载一个 office PIA 安装下就ok了
 
Office文件转换成Html格式功能代码如下:  

using  Microsoft.Office.Core;
using Microsoft.Office.Interop.PowerPoint;
using System;
using System.Collections.Generic;
using System.Linq;
using System.Text;
using System.Web;
using System.IO;
using System.Text.RegularExpressions;
using Nd.Webs;
using Aspose.Cells;
using Aspose.Words;
using ND.CommonHelper;
using Microsoft.Office.Interop.PowerPoint;
using Microsoft.Office.Core;
namespace Api.Note.Base
{
#region Office文件转换成Html格式
class OfficeHtmlBo
{
#region InsertHeadHtml
/// <summary>
/// InsertHeadHtml
/// </summary>
/// <param  name="WordFilePath">InsertHeadHtml</param>
private string  InsertHeadHtml(string strHtml, string realPath)
{
int index  = strHtml.IndexOf("<body");
strHtml =  strHtml.Insert(index, "<div  style='height:60px;font-size:14px;margin:0px 0px  12px 0px;padding:14px 4px 12px 12px;line-height:24px;height:1%;'>以下是该文档的HTML预览效果。<br/><span>由于是网页提取显示word中的内容,有可能部分显示与源文档中有差异,如想查看更准确的信息,</span>您可以点击 <a  style='color:6699FF;text-decoration:underline;'  href='/Lib/UdControls/Download.aspx?action=Download&appFormCode=" +  HttpContext.Current.Request.QueryString["appFormCode"].ToString() +  "&path=" +  HttpContext.Current.Request.QueryString["path"].ToString() +  "&encrypt=" + HttpContext.Current.Request.QueryString["encrypt"].ToString()  + "'><b>下载原始附件</b></a></div>");
Regex  reg = new  Regex(@"(?<start><img[^>]+?src="")(?<src>[^""]+?)(?<end>""[^>]+?>)");
strHtml =  reg.Replace(strHtml, delegate(Match m)
{
return string.Format("{0}{1}{2}{3}",
m.Groups["start"].Value,
realPath,
m.Groups["src"].Value,
m.Groups["end"].Value
);
});
return strHtml;
}
#endregion
#region GetLeftStr
/// <summary>
/// 截取字符串左边指定长度
/// </summary>
/// <param  name="str"></param>
/// <param  name="length"></param>
///  <returns></returns>
public string GetLeftStr(string  str, int length)
{
length =  length * 2;
string  tempStr = "";
int i = 0;
foreach  (char c in str)
{
tempStr += c.ToString();
if (((int)c >= 33) && ((int)c <= 126))
{
//字母和符号原样保留
i += 1;
}
else
{
i += 2;
}
if (i >= length)
{
return tempStr;
}
}
return  str;
}
#endregion
#region 将Word文档转换成HTML格式
/// <summary>
/// 将Word文档转换成HTML格式
/// </summary>
/// <param  name="WordFilePath">Word文档格式</param>
private void WordToHtmlFile(string  WordFilePath)
{
try
{
// 指定原文件和目标文件
string realPath = WordFilePath.Substring(0,  WordFilePath.LastIndexOf("/") + 1);
WordFilePath = System.Web.HttpContext.Current.Server.MapPath(WordFilePath);
object target = WordFilePath.Substring(0,  WordFilePath.LastIndexOf(".")) + ".html";
//string realPath = WordFilePath.Substring(0,  WordFilePath.LastIndexOf(".")) + ".html";
if (!File.Exists(target.ToString()))
{
Document doc = new Document(WordFilePath);
doc.Save(target.ToString(), SaveFormat.Html);
}
StreamReader sr = new StreamReader(target.ToString(), Encoding.Default);
string strHtml = sr.ReadToEnd();
strHtml = InsertHeadHtml(strHtml, realPath);
HttpContext.Current.Response.Write(strHtml);
sr.Close();
}
catch  (Exception ex)
{
//记录异常
LogEntry logEntry = new LogEntry();
logEntry.Message = ex.Message;
logEntry.Title = "---->将Word文档转换成HTML格式异常[WordToHtmlFile]";
logEntry.TimeStamp = DateTime.Now;
logEntry.LogEntryType = LogEntryType.Error;
logEntry.LogCatalog = LogCatalog.ExceptionLog;
logEntry.StackTrace = ex.StackTrace;
LogPosition logPosition = LogPosition.FileLog;
string positionParameter =  SysConfig.ToString(SysConfig.GetAppSetting("LogPath"));
SysLogger.Write(logEntry, logPosition, positionParameter);
}
}
#endregion
#region 将Excel文件转换成HTML格式
/// <summary>
/// 将Excel文件转换成HTML格式
/// </summary>
/// <param  name="ExcelFilePath">Excel文件路径</param>
private void  ExcelToHtmlFile(string ExcelFilePath)
{
try
{
string realPath = ExcelFilePath.Substring(0,  ExcelFilePath.LastIndexOf("/") + 1);
int index = ExcelFilePath.LastIndexOf("/");
string fileName;
if (ExcelFilePath.IndexOf(":") != -1)
{
fileName = ExcelFilePath.Split(new char[] { ':' })[0].ToString();
fileName = GetLeftStr(fileName.Substring(0,  fileName.LastIndexOf(".")), 10) +  fileName.Substring(fileName.LastIndexOf("."));
fileName = HttpUtility.UrlEncode(fileName, Encoding.UTF8);
}
else
{
fileName = ExcelFilePath.Substring(index + 1, ExcelFilePath.Length - index -  1);
fileName = GetLeftStr(fileName.Substring(0,  fileName.LastIndexOf(".")), 10) +  fileName.Substring(fileName.LastIndexOf("."));
//编码
fileName = HttpUtility.UrlEncode(fileName, Encoding.UTF8);
}
fileName = fileName.Substring(0, fileName.LastIndexOf("."));
ExcelFilePath = System.Web.HttpContext.Current.Server.MapPath(ExcelFilePath);
//目标html文件路径
object target = ExcelFilePath.Substring(0,  ExcelFilePath.LastIndexOf(".")) + ".html";
string target2 = ExcelFilePath.Substring(0,  ExcelFilePath.LastIndexOf("\\")) + "\\" + fileName +  "_files\\sheet001.htm";
if (!File.Exists(target.ToString()))
{
//为了保险,只读方式打开
//object readOnly = true;
//// 指定另存为格式(html)
//object format = Microsoft.Office.Interop.Excel.XlFileFormat.xlHtml;
////打开Excel文件
//oBook = excelApp.Workbooks.Open(ExcelFilePath, Unknown, readOnly,
//  Unknown, Unknown, Unknown, Unknown, Unknown, Unknown,
//  Unknown, Unknown, Unknown, Unknown, Unknown, Unknown);
//// 转换格式
//oBook.SaveAs(target, format, Unknown, Unknown, Unknown, Unknown,
//    Microsoft.Office.Interop.Excel.XlSaveAsAccessMode.xlNoChange,
//   Unknown, Unknown, Unknown, Unknown, Unknown);
Workbook wBook = new Workbook();
wBook.Open(ExcelFilePath);
wBook.Save(target.ToString(), FileFormatType.Html);
}
StreamReader sr = new StreamReader(target2.ToString(), Encoding.Default);
string strHtml = sr.ReadToEnd();
strHtml = InsertHeadHtml(strHtml, realPath);
strHtml = strHtml.Replace("window.location.replace", "");
strHtml = strHtml.Replace("filelist.xml", realPath + "/"  + fileName + "_files/filelist.xml");
strHtml = strHtml.Replace("stylesheet.css", realPath +  "/" + fileName + "_files/stylesheet.css");
HttpContext.Current.Response.Write(strHtml);
sr.Close();
}
catch  (Exception ex)
{
//记录异常
LogEntry logEntry = new LogEntry();
logEntry.Message = ex.Message;
logEntry.Title = "---->将Excel文件转换成HTML格式[ExcelToHtmlFile]";
logEntry.TimeStamp = DateTime.Now;
logEntry.LogEntryType = LogEntryType.Error;
logEntry.LogCatalog = LogCatalog.ExceptionLog;
logEntry.StackTrace = ex.StackTrace;
LogPosition logPosition = LogPosition.FileLog;
string positionParameter =  SysConfig.ToString(SysConfig.GetAppSetting("LogPath"));
SysLogger.Write(logEntry, logPosition, positionParameter);
}
}
#endregion
#region 将PPT文件转换成HTML格式
/// <summary>
/// 将PPT文件转换成HTML格式
/// </summary>
/// <param  name="PptFilePath">PPT文件路径</param>
private void PptToHtmlFile(string  PptFilePath)
{
ApplicationClass ac = new ApplicationClass();
Presentation pptFile = null;
try
{
string realPath = PptFilePath.Substring(0,  PptFilePath.LastIndexOf(".")) + ".html";
PptFilePath = System.Web.HttpContext.Current.Server.MapPath(PptFilePath);
//获得html文件名
object target = PptFilePath.Substring(0,  PptFilePath.LastIndexOf(".")) + ".html";
if (!File.Exists(target.ToString()))
{
if (PptFilePath.Contains(".pptx"))
{
pptFile = ac.Presentations.Open2007(PptFilePath, MsoTriState.msoCTrue,  MsoTriState.msoCTrue, MsoTriState.msoFalse, MsoTriState.msoFalse);
pptFile.SaveAs(target.ToString(), PpSaveAsFileType.ppSaveAsHTML,  MsoTriState.msoCTrue);
}
else if (PptFilePath.Contains(".ppt"))
{
pptFile = ac.Presentations.Open(PptFilePath, MsoTriState.msoCTrue,  MsoTriState.msoCTrue, MsoTriState.msoFalse);
pptFile.SaveAs(target.ToString(), PpSaveAsFileType.ppSaveAsHTML,  MsoTriState.msoCTrue);
}
}
//StreamReader sr = new StreamReader(target.ToString(), Encoding.Default);
//string strHtml = sr.ReadToEnd();
//Response.Write(strHtml);
HttpContext.Current.Response.Redirect(realPath);
}
finally
{
if (pptFile != null)
{
pptFile.Close();
}
ac.Quit();
GC.Collect();
}
}
#endregion
}
#endregion
}

您可能感兴趣的文章:

内容来自用户分享和网络整理,不保证内容的准确性,如有侵权内容,可联系管理员处理 点击这里给我发消息
标签:  C# PPT 转换 HTML