如何把 HTML 代码转换成纯文本

先对 HTML 字符串进行解码(如果它是以转义形式保存的),然后用下面这段代码把它转换为纯文本:

/// <summary>
/// Converts an HTML fragment or document into approximate plain text.
/// </summary>
/// <remarks>
/// The conversion is regex based and best effort; it is not an HTML parser.
/// The head, script and style elements are dropped together with their
/// content, a few structural tags are turned into whitespace, every other
/// tag is removed, and a small set of character entities is decoded.
/// </remarks>
/// <param name="source">The HTML markup to convert. May be null or empty.</param>
/// <returns>
/// The plain-text rendering of <paramref name="source"/>, or an empty string
/// when <paramref name="source"/> is null or empty.
/// </returns>
public static string HtmlToText(string source)
{
    if (string.IsNullOrEmpty(source))
    {
        return string.Empty;
    }

    const RegexOptions options = RegexOptions.IgnoreCase;

    // Line breaks and tabs in the markup are not significant: flatten them to
    // spaces. This also lets '.' in the patterns below span the whole input.
    string result = source.Replace("\r", " ");
    result = result.Replace("\n", " ");
    result = result.Replace("\t", " ");

    // Remove the header. Tags are first normalised (attributes and inner
    // spaces dropped) so the removal pattern can match them literally. The
    // lazy ".*?" stops at the first closing tag instead of the last one.
    result = Regex.Replace(result, @"<( )*head\b([^>])*>", "<head>", options);
    result = Regex.Replace(result, @"(<( )*(/)( )*head( )*>)", "</head>", options);
    result = Regex.Replace(result, "(<head>).*?(</head>)", string.Empty, options);

    // Remove all scripts. Lazy matching keeps the text that sits between two
    // separate script blocks.
    result = Regex.Replace(result, @"<( )*script\b([^>])*>", "<script>", options);
    result = Regex.Replace(result, @"(<( )*(/)( )*script( )*>)", "</script>", options);
    result = Regex.Replace(result, @"(<script>).*?(</script>)", string.Empty, options);

    // Remove all styles.
    result = Regex.Replace(result, @"<( )*style\b([^>])*>", "<style>", options);
    result = Regex.Replace(result, @"(<( )*(/)( )*style( )*>)", "</style>", options);
    result = Regex.Replace(result, "(<style>).*?(</style>)", string.Empty, options);

    // Separate table cells: each <td> tag becomes a single space.
    result = Regex.Replace(result, @"<( )*td\b([^>])*>", " ", options);

    // Insert line breaks in place of <br> and <li> tags. Attributes and the
    // self-closing forms (<br/>, <br />) are accepted.
    result = Regex.Replace(result, @"<( )*br\b([^>])*>", "\r", options);
    result = Regex.Replace(result, @"<( )*li\b([^>])*>", "\r", options);

    // Insert paragraph breaks in place of <tr> and <p> tags.
    result = Regex.Replace(result, @"<( )*tr\b([^>])*>", "\r\r", options);
    result = Regex.Replace(result, @"<( )*p\b([^>])*>", "\r\r", options);

    // Remove anything else that is enclosed inside < >.
    result = Regex.Replace(result, @"<[^>]*>", string.Empty, options);

    // Replace special characters. "&amp;" is decoded last so that escaped
    // text such as "&amp;lt;" ends up as the literal "&lt;" rather than being
    // decoded twice or swallowed by the catch-all below.
    result = Regex.Replace(result, @"&nbsp;", " ", options);
    result = Regex.Replace(result, @"&lt;", "<", options);
    result = Regex.Replace(result, @"&gt;", ">", options);
    // Drop any other short entity. Only entity-like tokens are matched, so
    // ordinary text containing '&' and ';' is left alone.
    result = Regex.Replace(result, @"&(?!amp;)[#\w]{2,6};", string.Empty, options);
    result = Regex.Replace(result, @"&amp;", "&", options);

    // Remove extra spaces and line breaks.
    result = Regex.Replace(result, @" ( )+", " ");
    result = Regex.Replace(result, "(\r)( )+(\r)", "\r\r");
    result = Regex.Replace(result, @"(\r\r)+", "\r\n");

    return result;
}

  • 0
    点赞
  • 1
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值