/// <summary>
/// Converts a Word document to HTML and returns the HTML text.
/// </summary>
/// <param name="wordFileName">Path of the Word file to load; everything before the last backslash is used as the output directory.</param>
/// <param name="encode">Encoding passed to GetStringByFile when the generated HTML file is read back.</param>
/// <returns>The string produced by GetStringByFile for the generated .html file.</returns>
public static string WordToHtml(string wordFileName, Encoding encode)
{
// The Word file must already be saved on disk before this method is called.
string dtTicks = DateTime.Now.Ticks.ToString();
// The HTML file is written next to the Word file and named after the current tick count.
string dir = wordFileName.Substring(0, wordFileName.LastIndexOf("\\"));
string strSaveFileName = dir + "\\" + dtTicks + ".html";
Aspose.Words.Document awd = new Aspose.Words.Document(wordFileName);
awd.Save(strSaveFileName, Aspose.Words.SaveFormat.Html);
// Read the generated HTML file back and return its text.
string html = GetStringByFile(strSaveFileName, encode);
// Disabled: keep only the markup between <body ...> and </body> (drops the head content).
//html = html.Substring(html.IndexOf("<body"));
//html = html.Substring(html.IndexOf(">") + 1);
//html = html.Substring(0, html.LastIndexOf("</body>"));
return html;
// NOTE(review): the closing brace of this method is missing at this point and the
// same method text is repeated directly below - this looks like a duplicated paste; confirm and remove one copy.
/// <summary>
/// Converts a Word document on disk to HTML with Aspose.Words and returns the HTML text.
/// </summary>
/// <remarks>
/// The HTML is written to a new file, named after the current tick count, in the same
/// directory as the Word file, and is then read back through GetStringByFile.
/// The generated .html file is not deleted by this method.
/// Requires a reference to Aspose.Words.dll.
/// </remarks>
/// <param name="wordFileName">Path of the Word file (doc/docx). The file must already be saved on disk.</param>
/// <param name="encode">
/// Encoding used to write the HTML file and passed to GetStringByFile to read it back.
/// When null, the file is saved with the Aspose.Words default and null is forwarded to GetStringByFile.
/// </param>
/// <returns>The text of the generated HTML document as returned by GetStringByFile (nothing is stripped).</returns>
/// <exception cref="ArgumentException"><paramref name="wordFileName"/> is null or empty.</exception>
public static string WordToHtml(string wordFileName, Encoding encode)
{
    if (string.IsNullOrEmpty(wordFileName))
    {
        throw new ArgumentException("wordFileName must not be null or empty.", "wordFileName");
    }

    // Path APIs instead of manual backslash slicing: a bare file name (no directory part)
    // no longer throws, and both separator styles are handled.
    string dir = System.IO.Path.GetDirectoryName(wordFileName) ?? string.Empty;
    string htmlFileName = DateTime.Now.Ticks.ToString() + ".html";
    string htmlPath = System.IO.Path.Combine(dir, htmlFileName);

    Aspose.Words.Document document = new Aspose.Words.Document(wordFileName);
    if (encode != null)
    {
        // Save with the same encoding that is used to read the file back below,
        // so the round trip cannot garble non-ASCII text.
        Aspose.Words.Saving.HtmlSaveOptions saveOptions =
            new Aspose.Words.Saving.HtmlSaveOptions(Aspose.Words.SaveFormat.Html);
        saveOptions.Encoding = encode;
        document.Save(htmlPath, saveOptions);
    }
    else
    {
        document.Save(htmlPath, Aspose.Words.SaveFormat.Html);
    }

    // The whole document text is returned; callers that only want the markup inside
    // <body>...</body> have to cut it out themselves.
    return GetStringByFile(htmlPath, encode);
}
// Note: this code requires a reference to Aspose.Words.dll.
本文介绍了如何使用 Aspose.Words 库将 Word 文档转换为 HTML:先把 Word 文档保存到磁盘,再调用转换方法在同一目录下生成 HTML 文件并读取其内容,文中提供了相应的代码示例。需要注意的是,示例中用于清除 head 内容、只保留 body 部分的代码已被注释掉,因此函数返回的是完整的 HTML 文档。
2万+

被折叠的 条评论
为什么被折叠?



