前两天在园子里看到了BlackSoul 写的《asp.net将word转换为html保存 》的文章
http://www.51aspx.com/CT/Y33HPMEJERPC33/,觉得很实用,但是搭建项目时候缺不是那么回事儿,中间有很多问题,比如说word组建的引用、web.config权限的设置,看到了很多人在网上也在问这个问题,我把问题一一解决,测试成功,现在把全部项目源码文件分享给大家下载。
\n
项目截图:
\n
功能概述及注意事项:
\n
该源码主要是通过Asp.net2.0实现Word文档上传并自动转换为Html文件,原理是将word文档上传至服务器然后再转存为html格式文件,再解析html文件修改其页面样式和css。
\n
wordTmp为上传是word暂存文件夹
html为转换后html保存文件夹
\n
注意:
\n
请设置web.config中的<identity impersonate=”true” userName=”administrator” password=”51aspx”/>帐号和密码,否则会提示检索 COM 类工厂中 CLSID 为 {000209FF-0000-0000-C000-000000000046} 的组件时失败,原因是出现以下错误: 80070005。
\n
该用户类型为拥有user权限的用户即可
\n
示例Word文件是些笑话,希望能博得大家多多笑容!
\n
部分CS源码:
\n
public partial class _Default : System.Web.UI.Page
{
\n
// public WordToHTML() { }
\n
#region 上传文件并转换为html wordToHtml(wordFilePath)
\n
///
\n
/// 上传文件并转存为html
\n
///
\n
/// word文档在客户机的位置
/// 上传的html文件的地址
public string wordToHtml(System.Web.UI.HtmlControls.HtmlInputFile wordFilePath)
{
Microsoft.Office.Interop.Word.ApplicationClass word = new Microsoft.Office.Interop.Word.ApplicationClass();
Type wordType = word.GetType();
Microsoft.Office.Interop.Word.Documents docs = word.Documents;
\n
// 打开文件
Type docsType = docs.GetType();
\n
//应当先把文件上传至服务器然后再解析文件为html
string filePath = uploadWord(wordFilePath);
\n
//判断是否上传文件成功
if (filePath == “0″)
return “0″;
//判断是否为word文件
if (filePath == “1″)
return “1″;
\n
object fileName = filePath;
\n
Microsoft.Office.Interop.Word.Document doc = (Microsoft.Office.Interop.Word.Document) docsType.InvokeMember(“Open”,
System.Reflection.BindingFlags.InvokeMethod, null, docs, new Object[] { fileName, true, true });
\n
// 转换格式,另存为html
Type docType = doc.GetType();
\n
string filename = System.DateTime.Now.Year.ToString() + System.DateTime.Now.Month.ToString() + System.DateTime.Now.Day.ToString() +
System.DateTime.Now.Hour.ToString() + System.DateTime.Now.Minute.ToString() + System.DateTime.Now.Second.ToString();
\n
//被转换的html文档保存的位置
string ConfigPath = HttpContext.Current.Server.MapPath(“html/” + filename + “.html”);
object saveFileName = ConfigPath;
\n
/*下面是Microsoft Word 9 Object Library的写法,如果是10,可能写成:
* docType.InvokeMember(“SaveAs”, System.Reflection.BindingFlags.InvokeMethod,
* null, doc, new object[]{saveFileName, Word.WdSaveFormat.wdFormatFilteredHTML});
* 其它格式:
* wdFormatHTML
* wdFormatDocument
* wdFormatDOSText
* wdFormatDOSTextLineBreaks
* wdFormatEncodedText
* wdFormatRTF
* wdFormatTemplate
* wdFormatText
* wdFormatTextLineBreaks
* wdFormatUnicodeText
*/
docType.InvokeMember(“SaveAs”, System.Reflection.BindingFlags.InvokeMethod,
null, doc, new object[] { saveFileName, Microsoft.Office.Interop.Word.WdSaveFormat.wdFormatFilteredHTML });
\n
// 退出 Word
wordType.InvokeMember(“Quit”, System.Reflection.BindingFlags.InvokeMethod, null, word, null);
//转到新生成的页面
return (“/” + filename + “.html”);
}
#endregion
\n
public string uploadWord(System.Web.UI.HtmlControls.HtmlInputFile uploadFiles)
{
if (uploadFiles.PostedFile != null)
{
string fileName = uploadFiles.PostedFile.FileName;
int extendNameIndex = fileName.LastIndexOf(“.”);
string extendName = fileName.Substring(extendNameIndex);
string newName = “”;
try
{
//验证是否为word格式
if (extendName == “.doc”)
{
DateTime now = DateTime.Now;
newName = now.DayOfYear.ToString() + uploadFiles.PostedFile.ContentLength.ToString();
//上传路径 指当前上传页面的同一级的目录下面的wordTmp路径
uploadFiles.PostedFile.SaveAs(System.Web.HttpContext.Current.Server.MapPath(“wordTmp/” + newName + extendName));
}
else
{
return “1″;
}
}
catch
{
return “0″;
}
//return “http://” + HttpContext.Current.Request.Url.Host + HttpContext.Current.Request.ApplicationPath + “/wordTmp/” + newName + extendName;
return System.Web.HttpContext.Current.Server.MapPath(“wordTmp/” + newName + extendName);
}
\n
else
{
return “0″;
}
}
\n
protected void btnUpload_Click(object sender, EventArgs e)
{
try
{
//上传
uploadWord(File1);
//转换
wordToHtml(File1);
}
catch (Exception ex)
{
throw ex;
}
finally
{
Response.Write(“恭喜,转换成功!”);
}
}
\n
}
\n
完整项目源码下载
http://www.51aspx.com/CV/WordToHtml/
\n
来源:CNBLOGS