C#实现将PPT转换成HTML的方法

本文是一个C#的小程序,主要实现将ppt转换成html的功能,方法很多,此处与大家分享一下,希望能对大家的项目开发起到一定的借鉴作用。

主要功能代码如下:

using System;
 using System.Collections.Generic;
 using System.Text;
 using System.IO;
 using PPT = Microsoft.Office.Interop.PowerPoint;
 using System.Reflection;

namespace WritePptDemo
 {
   class Program
   {
     static void Main(string[] args)
     {
       string  path;     //文件路径变量

       PPT.Application pptApp;   //Excel应用程序变量
        PPT.Presentation pptDoc;   //Excel文档变量

       PPT.Presentation pptDoctmp;

      path  = @"C:\MyPPT.ppt";   //路径
       pptApp =  new PPT.ApplicationClass();  //初始化

      //如果已存在,则删除
       if  (File.Exists((string)path))
       {
          File.Delete((string)path);
       }

      //由于使用的是COM库,因此有许多变量需要用Nothing代替
       Object  Nothing = Missing.Value;
       pptDoc =  pptApp.Presentations.Add(Microsoft.Office.Core.MsoTriState.msoFalse);
        pptDoc.Slides.Add(1,  Microsoft.Office.Interop.PowerPoint.PpSlideLayout.ppLayoutText);

       string text = "示例文本";

      foreach  (PPT.Slide slide in pptDoc.Slides)
       {
          foreach (PPT.Shape shape in slide.Shapes)
          {
            shape.TextFrame.TextRange.InsertAfter(text);
          }
       }

        //WdSaveFormat为Excel文档的保存格式
        PPT.PpSaveAsFileType format = PPT.PpSaveAsFileType.ppSaveAsDefault;

      //将excelDoc文档对象的内容保存为XLSX文档 
        pptDoc.SaveAs(path, format, Microsoft.Office.Core.MsoTriState.msoFalse);

      //关闭excelDoc文档对象 
        pptDoc.Close();

      //关闭excelApp组件对象 
        pptApp.Quit();

       Console.WriteLine(path + " 创建完毕!");

       Console.ReadLine();


       string  pathHtml = @"c:\MyPPT.html";

       PPT.Application pa = new PPT.ApplicationClass();

       pptDoctmp = pa.Presentations.Open(path,  Microsoft.Office.Core.MsoTriState.msoTrue,  Microsoft.Office.Core.MsoTriState.msoFalse,  Microsoft.Office.Core.MsoTriState.msoFalse);
        PPT.PpSaveAsFileType formatTmp = PPT.PpSaveAsFileType.ppSaveAsHTML;
        pptDoctmp.SaveAs(pathHtml, formatTmp,  Microsoft.Office.Core.MsoTriState.msoFalse);
        pptDoctmp.Close();
       pa.Quit();
        Console.WriteLine(pathHtml + " 创建完毕!");
     }
   }
 }
 

以上程序是使用C# 先创建一个ppt 文件并向里面写入了文字,然后再把此ppt 转换成html  ,对于上面程序需要说明的其实就是

引用dll的问题, 在项目中添加引用,在com 组件中选择 microsoft powerpoint 11.0 object   library ,而如果你的电脑没有安装 office 2003 是不会有这个的,而如果安装的是office 2007 则是microsoft powerpoint 12.0 object   library。而且即使你引用成功后,还是会编译不通过,是因为少安装了 office   PIA  ,在安装office 时,如果你是选择的典型安装是不会安装这个的,因为这个只针对开发人员才会用到。可以到网上下载一个 office PIA 安装下就ok了
 
Office文件转换成Html格式功能代码如下:  

 using  Microsoft.Office.Core;
 using Microsoft.Office.Interop.PowerPoint;

using System;
 using System.Collections.Generic;
 using System.Linq;
 using System.Text;
 using System.Web;
 using System.IO;
 using System.Text.RegularExpressions;
 using Nd.Webs;
 using Aspose.Cells;
 using Aspose.Words;
 using ND.CommonHelper;
 using Microsoft.Office.Interop.PowerPoint;
 using Microsoft.Office.Core;

namespace Api.Note.Base
 {
   #region Office文件转换成Html格式
   class OfficeHtmlBo
   {
     #region InsertHeadHtml
     /// <summary>
     /// InsertHeadHtml
     /// </summary>
     /// <param  name="WordFilePath">InsertHeadHtml</param>
     private string  InsertHeadHtml(string strHtml, string realPath)
     {
       int index  = strHtml.IndexOf("<body");
       strHtml =  strHtml.Insert(index, "<div  style='height:60px;font-size:14px;margin:0px 0px  12px 0px;padding:14px 4px 12px 12px;line-height:24px;height:1%;'>以下是该文档的HTML预览效果。<br/><span>由于是网页提取显示word中的内容,有可能部分显示与源文档中有差异,如想查看更准确的信息,</span>您可以点击&nbsp;<a  style='color:6699FF;text-decoration:underline;'  href='/Lib/UdControls/Download.aspx?action=Download&appFormCode=" +  HttpContext.Current.Request.QueryString["appFormCode"].ToString() +  "&path=" +  HttpContext.Current.Request.QueryString["path"].ToString() +  "&encrypt=" + HttpContext.Current.Request.QueryString["encrypt"].ToString()  + "'><b>下载原始附件</b></a></div>");

      Regex  reg = new  Regex(@"(?<start><img[^>]+?src="")(?<src>[^""]+?)(?<end>""[^>]+?>)");
       strHtml =  reg.Replace(strHtml, delegate(Match m)
       {
          return string.Format("{0}{1}{2}{3}",
            m.Groups["start"].Value,
            realPath,
            m.Groups["src"].Value,
            m.Groups["end"].Value
            );
       });

       return strHtml;
     }
     #endregion

    #region GetLeftStr
     /// <summary>
     /// 截取字符串左边指定长度
     /// </summary>
     /// <param  name="str"></param>
     /// <param  name="length"></param>
     ///  <returns></returns>
     public string GetLeftStr(string  str, int length)
     {
       length =  length * 2;
       string  tempStr = "";
       int i = 0;
       foreach  (char c in str)
       {
          tempStr += c.ToString();
          if (((int)c >= 33) && ((int)c <= 126))
          {
            //字母和符号原样保留 
            i += 1;
          }
          else
          {
            i += 2;
          }
          if (i >= length)
          {
            return tempStr;
          }
       }
       return  str;
     }

     #endregion

    #region 将Word文档转换成HTML格式
     /// <summary>
     /// 将Word文档转换成HTML格式
     /// </summary>
     /// <param  name="WordFilePath">Word文档格式</param>
     private void WordToHtmlFile(string  WordFilePath)
     {
       try
       {
          // 指定原文件和目标文件
          string realPath = WordFilePath.Substring(0,  WordFilePath.LastIndexOf("/") + 1);
          WordFilePath = System.Web.HttpContext.Current.Server.MapPath(WordFilePath);
          object target = WordFilePath.Substring(0,  WordFilePath.LastIndexOf(".")) + ".html";
          //string realPath = WordFilePath.Substring(0,  WordFilePath.LastIndexOf(".")) + ".html";

         if (!File.Exists(target.ToString()))
          {
            Document doc = new Document(WordFilePath);
            doc.Save(target.ToString(), SaveFormat.Html);
          }
         StreamReader sr = new StreamReader(target.ToString(), Encoding.Default);
          string strHtml = sr.ReadToEnd();
         strHtml = InsertHeadHtml(strHtml, realPath);
          HttpContext.Current.Response.Write(strHtml);
         sr.Close();
       }
       catch  (Exception ex)
       {
          //记录异常
          LogEntry logEntry = new LogEntry();
          logEntry.Message = ex.Message;
          logEntry.Title = "---->将Word文档转换成HTML格式异常[WordToHtmlFile]";
          logEntry.TimeStamp = DateTime.Now;
          logEntry.LogEntryType = LogEntryType.Error;
          logEntry.LogCatalog = LogCatalog.ExceptionLog;
          logEntry.StackTrace = ex.StackTrace;
          LogPosition logPosition = LogPosition.FileLog;
          string positionParameter =  SysConfig.ToString(SysConfig.GetAppSetting("LogPath"));
          SysLogger.Write(logEntry, logPosition, positionParameter);
       }
     }
     #endregion

    #region 将Excel文件转换成HTML格式
     /// <summary>
     /// 将Excel文件转换成HTML格式
     /// </summary>
     /// <param  name="ExcelFilePath">Excel文件路径</param>
     private void  ExcelToHtmlFile(string ExcelFilePath)
     {
       try
       {
          string realPath = ExcelFilePath.Substring(0,  ExcelFilePath.LastIndexOf("/") + 1);
          int index = ExcelFilePath.LastIndexOf("/");
          string fileName;
          if (ExcelFilePath.IndexOf(":") != -1)
          {
            fileName = ExcelFilePath.Split(new char[] { ':' })[0].ToString();
            fileName = GetLeftStr(fileName.Substring(0,  fileName.LastIndexOf(".")), 10) +  fileName.Substring(fileName.LastIndexOf("."));
            fileName = HttpUtility.UrlEncode(fileName, Encoding.UTF8);
          }
          else
          {
            fileName = ExcelFilePath.Substring(index + 1, ExcelFilePath.Length - index -  1);
            fileName = GetLeftStr(fileName.Substring(0,  fileName.LastIndexOf(".")), 10) +  fileName.Substring(fileName.LastIndexOf("."));
            //编码
            fileName = HttpUtility.UrlEncode(fileName, Encoding.UTF8);
          }
          fileName = fileName.Substring(0, fileName.LastIndexOf("."));
          ExcelFilePath = System.Web.HttpContext.Current.Server.MapPath(ExcelFilePath);
          //目标html文件路径
          object target = ExcelFilePath.Substring(0,  ExcelFilePath.LastIndexOf(".")) + ".html";
         string target2 = ExcelFilePath.Substring(0,  ExcelFilePath.LastIndexOf("\\")) + "\\" + fileName +  "_files\\sheet001.htm";
          if (!File.Exists(target.ToString()))
          {
            //为了保险,只读方式打开 
            //object readOnly = true;
            //// 指定另存为格式(html) 
            //object format = Microsoft.Office.Interop.Excel.XlFileFormat.xlHtml;
           ////打开Excel文件
            //oBook = excelApp.Workbooks.Open(ExcelFilePath, Unknown, readOnly,
            //  Unknown, Unknown, Unknown, Unknown, Unknown, Unknown,
            //  Unknown, Unknown, Unknown, Unknown, Unknown, Unknown);
           //// 转换格式 
            //oBook.SaveAs(target, format, Unknown, Unknown, Unknown, Unknown,
            //    Microsoft.Office.Interop.Excel.XlSaveAsAccessMode.xlNoChange,
            //   Unknown, Unknown, Unknown, Unknown, Unknown);

           Workbook wBook = new Workbook();
            wBook.Open(ExcelFilePath);
            wBook.Save(target.ToString(), FileFormatType.Html);
          }

         StreamReader sr = new StreamReader(target2.ToString(), Encoding.Default);
          string strHtml = sr.ReadToEnd();

         strHtml = InsertHeadHtml(strHtml, realPath);

         strHtml = strHtml.Replace("window.location.replace", "");
          strHtml = strHtml.Replace("filelist.xml", realPath + "/"  + fileName + "_files/filelist.xml");
          strHtml = strHtml.Replace("stylesheet.css", realPath +  "/" + fileName + "_files/stylesheet.css");
          HttpContext.Current.Response.Write(strHtml);

         sr.Close();
       }
       catch  (Exception ex)
       {
          //记录异常
          LogEntry logEntry = new LogEntry();
          logEntry.Message = ex.Message;
          logEntry.Title = "---->将Excel文件转换成HTML格式[ExcelToHtmlFile]";
          logEntry.TimeStamp = DateTime.Now;
          logEntry.LogEntryType = LogEntryType.Error;
          logEntry.LogCatalog = LogCatalog.ExceptionLog;
          logEntry.StackTrace = ex.StackTrace;
          LogPosition logPosition = LogPosition.FileLog;
          string positionParameter =  SysConfig.ToString(SysConfig.GetAppSetting("LogPath"));
          SysLogger.Write(logEntry, logPosition, positionParameter);
       }
     }
     #endregion

    #region 将PPT文件转换成HTML格式
     /// <summary>
     /// 将PPT文件转换成HTML格式
     /// </summary>
     /// <param  name="PptFilePath">PPT文件路径</param>
     private void PptToHtmlFile(string  PptFilePath)
     {
        ApplicationClass ac = new ApplicationClass();
        Presentation pptFile = null;
       try
       {
          string realPath = PptFilePath.Substring(0,  PptFilePath.LastIndexOf(".")) + ".html";
          PptFilePath = System.Web.HttpContext.Current.Server.MapPath(PptFilePath);
          //获得html文件名
          object target = PptFilePath.Substring(0,  PptFilePath.LastIndexOf(".")) + ".html";

         if (!File.Exists(target.ToString()))
          {
            if (PptFilePath.Contains(".pptx"))
            {
              pptFile = ac.Presentations.Open2007(PptFilePath, MsoTriState.msoCTrue,  MsoTriState.msoCTrue, MsoTriState.msoFalse, MsoTriState.msoFalse);
              pptFile.SaveAs(target.ToString(), PpSaveAsFileType.ppSaveAsHTML,  MsoTriState.msoCTrue);
            }
            else if (PptFilePath.Contains(".ppt"))
            {
              pptFile = ac.Presentations.Open(PptFilePath, MsoTriState.msoCTrue,  MsoTriState.msoCTrue, MsoTriState.msoFalse);
              pptFile.SaveAs(target.ToString(), PpSaveAsFileType.ppSaveAsHTML,  MsoTriState.msoCTrue);
            }
          }
          //StreamReader sr = new StreamReader(target.ToString(), Encoding.Default);
          //string strHtml = sr.ReadToEnd();
          //Response.Write(strHtml);
          HttpContext.Current.Response.Redirect(realPath);
       }
       finally
       {
          if (pptFile != null)
          {
            pptFile.Close();
          }
          ac.Quit();
          GC.Collect();
       }
     }
     #endregion
   }
   #endregion
}