这只是一个小程序,就是将ppt转换成html,方法很多,为了以后备用,在此记录一下,也和大家分享 源码如下:
using System; using System.Collections.Generic; using System.Text; using System.IO; using PPT = Microsoft.Office.Interop.PowerPoint; using System.Reflection;
namespace WritePptDemo { class Program { static void Main(string[] args) { string path; //文件路径变量
PPT.Application pptApp; //Excel应用程序变量 PPT.Presentation pptDoc; //Excel文档变量
PPT.Presentation pptDoctmp;
path = @"C:\MyPPT.ppt"; //路径 pptApp = new PPT.ApplicationClass(); //初始化
//如果已存在,则删除 if (File.Exists((string)path)) { File.Delete((string)path); }
//由于使用的是COM库,因此有许多变量需要用Nothing代替 Object Nothing = Missing.Value; pptDoc = pptApp.Presentations.Add(Microsoft.Office.Core.MsoTriState.msoFalse); pptDoc.Slides.Add(1, Microsoft.Office.Interop.PowerPoint.PpSlideLayout.ppLayoutText);
string text = "示例文本";
foreach (PPT.Slide slide in pptDoc.Slides) { foreach (PPT.Shape shape in slide.Shapes) { shape.TextFrame.TextRange.InsertAfter(text); } }
//WdSaveFormat为Excel文档的保存格式 PPT.PpSaveAsFileType format = PPT.PpSaveAsFileType.ppSaveAsDefault;
//将excelDoc文档对象的内容保存为XLSX文档 pptDoc.SaveAs(path, format, Microsoft.Office.Core.MsoTriState.msoFalse);
//关闭excelDoc文档对象 pptDoc.Close();
//关闭excelApp组件对象 pptApp.Quit();
Console.WriteLine(path + " 创建完毕!");
Console.ReadLine();
string pathHtml = @"c:\MyPPT.html";
PPT.Application pa = new PPT.ApplicationClass();
pptDoctmp = pa.Presentations.Open(path, Microsoft.Office.Core.MsoTriState.msoTrue, Microsoft.Office.Core.MsoTriState.msoFalse, Microsoft.Office.Core.MsoTriState.msoFalse); PPT.PpSaveAsFileType formatTmp = PPT.PpSaveAsFileType.ppSaveAsHTML; pptDoctmp.SaveAs(pathHtml, formatTmp, Microsoft.Office.Core.MsoTriState.msoFalse); pptDoctmp.Close(); pa.Quit(); Console.WriteLine(pathHtml + " 创建完毕!"); } } } 以上程序是使用C# 先创建一个ppt 文件并向里面写入了文字,然后再把此ppt 转换成html ,对于上面程序需要说明的其实就是 引用dll的问题, 在项目中添加引用,在com 组件中选择 microsoft powerpoint 11.0 object library ,而如果你的电脑没有安装 office 2003 是不会有这个的,而如果安装的是office 2007 则是microsoft powerpoint 12.0 object library。而且即使你引用成功后,还是会编译不通过,是因为少安装了 office PIA ,在安装office 时,如果你是选择的典型安装是不会安装这个的,因为这个只针对开发人员才会用到。可以到网上下载一个 office PIA 安装下就ok了 ----------------------------------Office文件转换成Html格式--------------------------------------------------------------------------------------------------------------------------------------------------------- using Microsoft.Office.Core; using Microsoft.Office.Interop.PowerPoint;
using System; using System.Collections.Generic; using System.Linq; using System.Text; using System.Web; using System.IO; using System.Text.RegularExpressions; using Nd.Webs; using Aspose.Cells; using Aspose.Words; using ND.CommonHelper; using Microsoft.Office.Interop.PowerPoint; using Microsoft.Office.Core;
namespace Api.Note.Base { #region Office文件转换成Html格式 class OfficeHtmlBo { #region InsertHeadHtml /// <summary> /// InsertHeadHtml /// </summary> /// <param name="WordFilePath">InsertHeadHtml</param> private string InsertHeadHtml(string strHtml, string realPath) { int index = strHtml.IndexOf("<body"); strHtml = strHtml.Insert(index, "<div style='height:60px;font-size:14px;margin:0px 0px 12px 0px;padding:14px 4px 12px 12px;line-height:24px;height:1%;'>以下是该文档的HTML预览效果。<br/><span>由于是网页提取显示word中的内容,有可能部分显示与源文档中有差异,如想查看更准确的信息,</span>您可以点击 <a style='color:6699FF;text-decoration:underline;' href='/Lib/UdControls/Download.aspx?action=Download&appFormCode=" + HttpContext.Current.Request.QueryString["appFormCode"].ToString() + "&path=" + HttpContext.Current.Request.QueryString["path"].ToString() + "&encrypt=" + HttpContext.Current.Request.QueryString["encrypt"].ToString() + "'><b>下载原始附件</b></a></div>");
Regex reg = new Regex(@"(?<start><img[^>]+?src="")(?<src>[^""]+?)(?<end>""[^>]+?>)"); strHtml = reg.Replace(strHtml, delegate(Match m) { return string.Format("{0}{1}{2}{3}", m.Groups["start"].Value, realPath, m.Groups["src"].Value, m.Groups["end"].Value ); });
return strHtml; } #endregion
#region GetLeftStr /// <summary> /// 截取字符串左边指定长度 /// </summary> /// <param name="str"></param> /// <param name="length"></param> /// <returns></returns> public string GetLeftStr(string str, int length) { length = length * 2; string tempStr = ""; int i = 0; foreach (char c in str) { tempStr += c.ToString(); if (((int)c >= 33) && ((int)c <= 126)) { //字母和符号原样保留 i += 1; } else { i += 2; } if (i >= length) { return tempStr; } } return str; }
#endregion
#region 将Word文档转换成HTML格式 /// <summary> /// 将Word文档转换成HTML格式 /// </summary> /// <param name="WordFilePath">Word文档格式</param> private void WordToHtmlFile(string WordFilePath) { try { // 指定原文件和目标文件 string realPath = WordFilePath.Substring(0, WordFilePath.LastIndexOf("/") + 1); WordFilePath = System.Web.HttpContext.Current.Server.MapPath(WordFilePath); object target = WordFilePath.Substring(0, WordFilePath.LastIndexOf(".")) + ".html"; //string realPath = WordFilePath.Substring(0, WordFilePath.LastIndexOf(".")) + ".html";
if (!File.Exists(target.ToString())) { Document doc = new Document(WordFilePath); doc.Save(target.ToString(), SaveFormat.Html); }
StreamReader sr = new StreamReader(target.ToString(), Encoding.Default); string strHtml = sr.ReadToEnd();
strHtml = InsertHeadHtml(strHtml, realPath); HttpContext.Current.Response.Write(strHtml);
sr.Close(); } catch (Exception ex) { //记录异常 LogEntry logEntry = new LogEntry(); logEntry.Message = ex.Message; logEntry.Title = "---->将Word文档转换成HTML格式异常[WordToHtmlFile]"; logEntry.TimeStamp = DateTime.Now; logEntry.LogEntryType = LogEntryType.Error; logEntry.LogCatalog = LogCatalog.ExceptionLog; logEntry.StackTrace = ex.StackTrace; LogPosition logPosition = LogPosition.FileLog; string positionParameter = SysConfig.ToString(SysConfig.GetAppSetting("LogPath")); SysLogger.Write(logEntry, logPosition, positionParameter); } } #endregion
#region 将Excel文件转换成HTML格式 /// <summary> /// 将Excel文件转换成HTML格式 /// </summary> /// <param name="ExcelFilePath">Excel文件路径</param> private void ExcelToHtmlFile(string ExcelFilePath) { try { string realPath = ExcelFilePath.Substring(0, ExcelFilePath.LastIndexOf("/") + 1); int index = ExcelFilePath.LastIndexOf("/"); string fileName; if (ExcelFilePath.IndexOf(":") != -1) { fileName = ExcelFilePath.Split(new char[] { ':' })[0].ToString(); fileName = GetLeftStr(fileName.Substring(0, fileName.LastIndexOf(".")), 10) + fileName.Substring(fileName.LastIndexOf(".")); fileName = HttpUtility.UrlEncode(fileName, Encoding.UTF8); } else { fileName = ExcelFilePath.Substring(index + 1, ExcelFilePath.Length - index - 1); fileName = GetLeftStr(fileName.Substring(0, fileName.LastIndexOf(".")), 10) + fileName.Substring(fileName.LastIndexOf(".")); //编码 fileName = HttpUtility.UrlEncode(fileName, Encoding.UTF8); } fileName = fileName.Substring(0, fileName.LastIndexOf(".")); ExcelFilePath = System.Web.HttpContext.Current.Server.MapPath(ExcelFilePath); //目标html文件路径 object target = ExcelFilePath.Substring(0, ExcelFilePath.LastIndexOf(".")) + ".html";
string target2 = ExcelFilePath.Substring(0, ExcelFilePath.LastIndexOf("\\")) + "\\" + fileName + "_files\\sheet001.htm"; if (!File.Exists(target.ToString())) { //为了保险,只读方式打开 //object readOnly = true; //// 指定另存为格式(html) //object format = Microsoft.Office.Interop.Excel.XlFileFormat.xlHtml;
////打开Excel文件 //oBook = excelApp.Workbooks.Open(ExcelFilePath, Unknown, readOnly, // Unknown, Unknown, Unknown, Unknown, Unknown, Unknown, // Unknown, Unknown, Unknown, Unknown, Unknown, Unknown);
//// 转换格式 //oBook.SaveAs(target, format, Unknown, Unknown, Unknown, Unknown, // Microsoft.Office.Interop.Excel.XlSaveAsAccessMode.xlNoChange, // Unknown, Unknown, Unknown, Unknown, Unknown);
Workbook wBook = new Workbook(); wBook.Open(ExcelFilePath); wBook.Save(target.ToString(), FileFormatType.Html); }
StreamReader sr = new StreamReader(target2.ToString(), Encoding.Default); string strHtml = sr.ReadToEnd();
strHtml = InsertHeadHtml(strHtml, realPath);
strHtml = strHtml.Replace("window.location.replace", ""); strHtml = strHtml.Replace("filelist.xml", realPath + "/" + fileName + "_files/filelist.xml"); strHtml = strHtml.Replace("stylesheet.css", realPath + "/" + fileName + "_files/stylesheet.css"); HttpContext.Current.Response.Write(strHtml);
sr.Close(); } catch (Exception ex) { //记录异常 LogEntry logEntry = new LogEntry(); logEntry.Message = ex.Message; logEntry.Title = "---->将Excel文件转换成HTML格式[ExcelToHtmlFile]"; logEntry.TimeStamp = DateTime.Now; logEntry.LogEntryType = LogEntryType.Error; logEntry.LogCatalog = LogCatalog.ExceptionLog; logEntry.StackTrace = ex.StackTrace; LogPosition logPosition = LogPosition.FileLog; string positionParameter = SysConfig.ToString(SysConfig.GetAppSetting("LogPath")); SysLogger.Write(logEntry, logPosition, positionParameter); } } #endregion
#region 将PPT文件转换成HTML格式 /// <summary> /// 将PPT文件转换成HTML格式 /// </summary> /// <param name="PptFilePath">PPT文件路径</param> private void PptToHtmlFile(string PptFilePath) { ApplicationClass ac = new ApplicationClass(); Presentation pptFile = null; try { string realPath = PptFilePath.Substring(0, PptFilePath.LastIndexOf(".")) + ".html"; PptFilePath = System.Web.HttpContext.Current.Server.MapPath(PptFilePath); //获得html文件名 object target = PptFilePath.Substring(0, PptFilePath.LastIndexOf(".")) + ".html";
if (!File.Exists(target.ToString())) { if (PptFilePath.Contains(".pptx")) { pptFile = ac.Presentations.Open2007(PptFilePath, MsoTriState.msoCTrue, MsoTriState.msoCTrue, MsoTriState.msoFalse, MsoTriState.msoFalse); pptFile.SaveAs(target.ToString(), PpSaveAsFileType.ppSaveAsHTML, MsoTriState.msoCTrue); } else if (PptFilePath.Contains(".ppt")) { pptFile = ac.Presentations.Open(PptFilePath, MsoTriState.msoCTrue, MsoTriState.msoCTrue, MsoTriState.msoFalse); pptFile.SaveAs(target.ToString(), PpSaveAsFileType.ppSaveAsHTML, MsoTriState.msoCTrue); } } //StreamReader sr = new StreamReader(target.ToString(), Encoding.Default); //string strHtml = sr.ReadToEnd(); //Response.Write(strHtml); HttpContext.Current.Response.Redirect(realPath); } finally { if (pptFile != null) { pptFile.Close(); } ac.Quit(); GC.Collect(); } } #endregion } #endregion
}
|