清除文本中Html的标签

2021-05-08 02:29

阅读:578

标签:reg   click   embed   pre   正则表达式   option   summary   替换   amp   

// Ordered list of regular expressions whose matches ClearHtml deletes.
// ReplaceHtml applies each one case-insensitively, so the patterns are
// written in lower case only.
//
// NOTE(review): tag patterns match by prefix ("</?b" also removes <br> and
// <body>, "</?p" also removes <pre>), which is harmless here because every
// match is deleted anyway. The scheme/event-handler patterns also fire on
// plain text (e.g. the "onkey" inside "monkey") - confirm that is acceptable
// for the callers before tightening them.
private static readonly string[] HtmlCleanupPatterns =
{
    // Numeric character references such as &#160; or &#xA0;.
    @"&#x?[0-9a-f]+;",
    "</?marquee[^>]*>",
    "</?object[^>]*>",
    "</?param[^>]*>",
    "</?embed[^>]*>",
    "</?table[^>]*>",
    "&nbsp;",
    "</?tr[^>]*>",
    "</?th[^>]*>",
    "</?p[^>]*>",
    "</?a[^>]*>",
    "</?img[^>]*>",
    "</?tbody[^>]*>",
    "</?li[^>]*>",
    "</?span[^>]*>",
    "</?div[^>]*>",
    "</?td[^>]*>",
    "</?script[^>]*>",
    // Script URL schemes and inline event-handler attribute prefixes.
    "(javascript|jscript|vbscript|vbs):",
    "on(mouse|exit|error|click|key)",
    // XML declarations and namespaced tags (e.g. <o:p>, </w:sdt>).
    @"<\?xml[^>]*>",
    @"</?[a-z]+:[^>]*>",
    "</?font[^>]*>",
    "</?b[^>]*>",
    "</?u[^>]*>",
    "</?i[^>]*>",
    "</?strong[^>]*>",
};

/// <summary>
/// Removes HTML markup from a piece of text: common opening/closing tags,
/// numeric character references, <c>&amp;nbsp;</c>, script URL schemes and
/// inline event-handler name prefixes.
/// </summary>
/// <remarks>
/// Only the tags themselves are deleted; text between an opening and a
/// closing tag (including the body of a script element) is kept.
/// Each pattern is applied once, in order, over the whole text.
/// </remarks>
/// <param name="Content">The text to clean. May be null or empty.</param>
/// <returns>
/// The text with every pattern match removed; an empty string when
/// <paramref name="Content"/> is null or empty.
/// </returns>
protected string ClearHtml(string Content)
{
    string cleaned = Content;
    foreach (string pattern in HtmlCleanupPatterns)
    {
        // ReplaceHtml normalizes null to "" so the first pass also
        // takes care of a null argument.
        cleaned = ReplaceHtml(pattern, "", cleaned);
    }
    return cleaned;
}
/// <summary>
/// Replaces every case-insensitive match of a regular expression in the
/// given text.
/// </summary>
/// <param name="patrn">Regular expression describing the text to replace.</param>
/// <param name="strRep">Replacement text inserted for each match.</param>
/// <param name="content">Text to process; null is treated as an empty string.</param>
/// <returns>The text with all matches replaced.</returns>
private string ReplaceHtml(string patrn, string strRep, string content)
{
    // A null input behaves exactly like an empty one.
    string input = content ?? "";
    return Regex.Replace(input, patrn, strRep, RegexOptions.IgnoreCase);
}
                  

清除文本中Html的标签

标签:reg   click   embed   pre   正则表达式   option   summary   替换   amp   

原文地址:https://www.cnblogs.com/TTonly/p/12082927.html


评论


亲,登录后才可以留言!