隐藏

C#Word转Html的类

发布:2021/11/29 15:26:05作者:管理员 来源:本站 浏览次数:860

已验证,可以在指定的文件目录下成功将doc文件转html

using System;

using System.Collections.Generic;
using System.IO;
using System.Linq;
using System.Text;

using System.Threading.Tasks;

 class WordToHtml
    {
        public static void CreateWordToHtmlFile(string WordFileDir)
        {
            DealWithWordFile(WordFileDir);
        }
        /// <summary>
        /// 搜索WordFileDir在的*.doc文件
        /// </summary>
        /// <param name="WordFileDir"></param>
        private static void DealWithWordFile(string WordFileDir)
        {
            //创建数组保存源文件夹下的文件名
            string[] strFiles = Directory.GetFiles(WordFileDir, "*.doc");
            for (int i = 0; i < strFiles.Length; i++)
            {
                WordToHtmlFile(strFiles[i]);
            }

            DirectoryInfo dirInfo = new DirectoryInfo(WordFileDir);
            //取得源文件夹下的所有子文件夹名称
            DirectoryInfo[] ZiPath = dirInfo.GetDirectories();
            for (int j = 0; j < ZiPath.Length; j++)
            {
                //获取所有子文件夹名
                string strZiPath = WordFileDir + "/" + ZiPath[j].ToString();
                //把得到的子文件夹当成新的源文件夹,从头开始新一轮的搜索
                DealWithWordFile(strZiPath);
            }
        }
        /// <summary>
        /// 转化
        /// </summary>
        /// <param name="WordFilePath"></param>
        private static void WordToHtmlFile(string WordFilePath)
        {
            try
            {
                Microsoft.Office.Interop.Word.Application newApp = new Microsoft.Office.Interop.Word.Application();
                // 指定原文件和目标文件
                object Source = WordFilePath;
                string SaveHtmlPath = WordFilePath.Substring(0, WordFilePath.Length - 3) + "html";
                object Target = SaveHtmlPath;

                // 缺省参数  
                object Unknown = Type.Missing;

                //为了保险,只读方式打开
                object readOnly = true;

                // 打开doc文件
                Microsoft.Office.Interop.Word.Document doc = newApp.Documents.Open(ref Source, ref Unknown,
                     ref readOnly, ref Unknown, ref Unknown,
                     ref Unknown, ref Unknown, ref Unknown,
                     ref Unknown, ref Unknown, ref Unknown,
                     ref Unknown, ref Unknown, ref Unknown,
                     ref Unknown, ref Unknown);

                // 指定另存为格式(rtf)
                object format = Microsoft.Office.Interop.Word.WdSaveFormat.wdFormatHTML;
                // 转换格式
                doc.SaveAs(ref Target, ref format,
                        ref Unknown, ref Unknown, ref Unknown,
                        ref Unknown, ref Unknown, ref Unknown,
                        ref Unknown, ref Unknown, ref Unknown,
                        ref Unknown, ref Unknown, ref Unknown,
                        ref Unknown, ref Unknown);

                // 关闭文档和Word程序
                doc.Close(ref Unknown, ref Unknown, ref Unknown);
                newApp.Quit(ref Unknown, ref Unknown, ref Unknown);
            }
            catch (Exception e)
            {
                System.Windows.Forms.MessageBox.Show(e.Message);
            }
        }
    }