ASP.NET(C#)去除字符串中的html标签
/// <summary>
/// Strips HTML markup from a string and returns the remaining text, HTML-encoded.
/// </summary>
/// <remarks>
/// Processing order: script elements (including their content) are removed, then all
/// remaining tags, then line breaks that are followed by whitespace, then comment
/// remnants. A fixed set of character entities is decoded in a single pass, every other
/// numeric character reference is dropped, and the result is HTML-encoded and trimmed.
/// </remarks>
/// <param name="requestString">The string to process. May be null or empty.</param>
/// <returns>
/// The text with HTML tags removed, HTML-encoded and trimmed; an empty string when
/// <paramref name="requestString"/> is null or empty.
/// </returns>
public static string RemoveHtml(string requestString)
{
    // Regex.Replace throws on null input; treat "nothing to clean" as an empty result.
    if (string.IsNullOrEmpty(requestString))
    {
        return string.Empty;
    }

    // Remove script elements together with their content. Singleline lets '.' match
    // line breaks, so scripts spanning several lines are removed as a whole instead of
    // leaving their source code behind once the tags are stripped.
    string text = Regex.Replace(
        requestString,
        @"<script[^>]*?>.*?</script>",
        "",
        RegexOptions.IgnoreCase | RegexOptions.Singleline);

    // Remove every remaining tag.
    text = Regex.Replace(text, @"<(.[^>]*)>", "");

    // Remove a line break together with the whitespace that follows it.
    text = Regex.Replace(text, @"([\r\n])[\s]+", "");

    // Remove leftovers of comments that the tag pattern could not match as a whole.
    text = Regex.Replace(text, @"-->", "");
    text = Regex.Replace(text, @"<!--.*", "");

    // Decode entities in ONE pass. Decoding them one after another (with &amp; first)
    // would turn "&amp;lt;" into "&lt;" and then into "<", corrupting literal text.
    text = Regex.Replace(
        text,
        @"&(quot|amp|lt|gt|nbsp|iexcl|cent|pound|copy|#\d+);",
        new MatchEvaluator(DecodeHtmlEntity),
        RegexOptions.IgnoreCase | RegexOptions.CultureInvariant);

    // Re-encode so the plain text can be embedded safely in an HTML page.
    return System.Web.HttpUtility.HtmlEncode(text).Trim();
}

/// <summary>
/// Maps one matched character entity to its replacement text.
/// </summary>
/// <param name="match">A match whose first group is the entity name or "#" plus digits.</param>
/// <returns>
/// The decoded character for the supported entities, an empty string for any other
/// numeric character reference, or the unchanged match text otherwise.
/// </returns>
private static string DecodeHtmlEntity(Match match)
{
    string entity = match.Groups[1].Value.ToLowerInvariant();
    switch (entity)
    {
        case "quot":
        case "#34":
            return "\"";
        case "amp":
        case "#38":
            return "&";
        case "lt":
        case "#60":
            return "<";
        case "gt":
        case "#62":
            return ">";
        case "nbsp":
        case "#160":
            return " ";
        case "iexcl":
        case "#161":
            return "\u00A1";
        case "cent":
        case "#162":
            return "\u00A2";
        case "pound":
        case "#163":
            return "\u00A3";
        case "copy":
        case "#169":
            return "\u00A9";
        default:
            // Unsupported numeric references are dropped; anything else is left alone.
            return entity.StartsWith("#", StringComparison.Ordinal) ? "" : match.Value;
    }
}
上一篇:C#判断字符串是否为日期型格式
下一篇:C#判断字符串是否为数字型格式