C# 把网页导出成 Word
以下是使用C#将网页导出为Word文档的示例代码:
using System;
using System.IO;
using System.Net;
using System.Text;
using System.Web;
using Microsoft.Office.Interop.Word;
namespace ConsoleApp1
{
    /// <summary>
    /// Console sample that downloads a web page and saves it as a Word document
    /// (output.docx) on the current user's desktop by automating Microsoft Word.
    /// </summary>
    class Program
    {
        /// <summary>
        /// Downloads the page at a fixed URL into a temporary .html file, inserts that
        /// file into a new Word document, and saves the document as output.docx on the desktop.
        /// </summary>
        /// <param name="args">Command-line arguments; not used.</param>
        static void Main(string[] args)
        {
            string url = "https://www.example.com"; // Address of the web page to export

            // Range.InsertFile accepts a file path, not a stream, so the page is staged
            // in a uniquely named temporary .html file first.
            string tempHtmlPath = Path.Combine(Path.GetTempPath(), Guid.NewGuid().ToString("N") + ".html");

            Application word = null;
            Document doc = null;
            try
            {
                // Fetch the page. The raw bytes are written unchanged, so no decode/re-encode
                // step can corrupt characters (the previous UTF-8 -> gb2312 round trip could).
                using (WebClient webClient = new WebClient())
                {
                    webClient.DownloadFile(url, tempHtmlPath);
                }

                // Create the Word application object and an empty document.
                word = new Application();
                doc = word.Documents.Add();

                // Insert the HTML file into the document body.
                // NOTE(review): relies on Word choosing its HTML converter from the
                // file extension/content when ConfirmConversions is false - confirm on target Word version.
                doc.Content.InsertFile(tempHtmlPath, ConfirmConversions: false, Link: false, Attachment: false);

                // Save the document, stating the docx format explicitly.
                object fileName = Path.Combine(Environment.GetFolderPath(Environment.SpecialFolder.Desktop), "output.docx");
                object fileFormat = WdSaveFormat.wdFormatXMLDocument;
                doc.SaveAs2(ref fileName, ref fileFormat);
            }
            finally
            {
                // Always shut Word down, even after a failure; otherwise a hidden
                // WINWORD.EXE instance started by this program would keep running.
                object doNotSave = WdSaveOptions.wdDoNotSaveChanges;
                if (doc != null)
                {
                    doc.Close(ref doNotSave);
                }

                if (word != null)
                {
                    word.Quit(ref doNotSave);
                }

                // File.Delete does nothing if the download never created the file.
                File.Delete(tempHtmlPath);
            }
        }
    }
}
需要注意的是,此代码需要在项目中引用 Microsoft.Office.Interop.Word 程序集,并且运行的机器上必须已安装 Microsoft Word 软件。另外,导出的 Word 文档的格式可能与原网页不完全一致,需要手动调整。
原文地址: https://www.cveoy.top/t/topic/btot 著作权归作者所有。请勿转载和采集!