zoukankan      html  css  js  c++  java
  • 【转】C# 过滤HTML,脚本,数据库关键字,特殊字符

        /// <summary>
    /// Strips script blocks, HTML tags and comments, a fixed list of SQL/shell keywords
    /// and a fixed set of special characters from the input, then HTML-encodes and trims
    /// what is left.
    /// </summary>
    /// <remarks>
    /// Keyword removal is substring based and case-insensitive, so ordinary words that
    /// contain a listed keyword are altered as well (for example "world" becomes "wld").
    /// This filter is a best-effort scrubber only; it does not replace parameterized
    /// queries or context-aware output encoding.
    /// </remarks>
    /// <param name="Htmlstring">Source text that may contain HTML, script, SQL keywords or special characters.</param>
    /// <returns>The filtered, HTML-encoded text; an empty string when the input is null or empty.</returns>
    public static string NoHTML(string Htmlstring)
    {
        if (string.IsNullOrEmpty(Htmlstring))
        {
            return "";
        }

        string text = Htmlstring;

        // Remove script blocks. Singleline lets '.' cross line breaks so that a script
        // body spanning several lines is removed together with its tags.
        text = Regex.Replace(text, @"<script[^>]*?>.*?</script>", "", NoHtmlMatchOptions | RegexOptions.Singleline);

        // Remove remaining tags, line breaks followed by whitespace, and comment leftovers.
        text = Regex.Replace(text, @"<(.[^>]*)>", "", NoHtmlMatchOptions);
        text = Regex.Replace(text, @"([\r\n])[\s]+", "", NoHtmlMatchOptions);
        text = Regex.Replace(text, @"-->", "", NoHtmlMatchOptions);
        text = Regex.Replace(text, @"<!--.*", "", NoHtmlMatchOptions);

        // Decode the known entities in table order, then drop any other numeric entity.
        for (int i = 0; i < NoHtmlEntities.GetLength(0); i++)
        {
            text = Regex.Replace(text, NoHtmlEntities[i, 0], NoHtmlEntities[i, 1], NoHtmlMatchOptions);
        }
        text = Regex.Replace(text, @"&#(\d+);", "", NoHtmlMatchOptions);

        // Removing one token can join its neighbours into another one
        // ("selselectect" -> "select", "sel-ect" -> "select"), so repeat until a full
        // pass changes nothing. Every change shortens the text, so the loop terminates.
        string previous;
        do
        {
            previous = text;

            foreach (string token in NoHtmlSpecialTokens)
            {
                text = text.Replace(token, "");
            }

            foreach (string keyword in NoHtmlKeywords)
            {
                text = Regex.Replace(text, Regex.Escape(keyword), "", NoHtmlMatchOptions);
            }
        }
        while (text != previous);

        // HttpUtility.HtmlEncode does not need an active HttpContext, so the method
        // also works outside a web request (background jobs, unit tests).
        return HttpUtility.HtmlEncode(text).Trim();
    }

    // Options shared by every pattern. CultureInvariant keeps case-insensitive matching
    // independent of the current thread culture.
    private const RegexOptions NoHtmlMatchOptions = RegexOptions.IgnoreCase | RegexOptions.CultureInvariant;

    // Entity pattern -> replacement text, applied in this order.
    private static readonly string[,] NoHtmlEntities =
    {
        { @"&(quot|#34);", "\"" },
        { @"&(amp|#38);", "&" },
        { @"&(lt|#60);", "<" },
        { @"&(gt|#62);", ">" },
        { @"&(nbsp|#160);", " " },
        { @"&(iexcl|#161);", "\u00A1" },
        { @"&(cent|#162);", "\u00A2" },
        { @"&(pound|#163);", "\u00A3" },
        { @"&(copy|#169);", "\u00A9" },
    };

    // Keywords removed as literal, case-insensitive substrings. Multi-word phrases are
    // listed before the single words they contain.
    private static readonly string[] NoHtmlKeywords =
    {
        "xp_cmdshell",
        "select",
        "insert",
        "delete from",
        "count''",
        "drop table",
        "truncate",
        "asc",
        "mid",
        "char",
        "exec master",
        "net localgroup administrators",
        "and",
        "net user",
        "or",
        "net",
        "delete",
        "drop",
        "script",
    };

    // Characters and sequences removed verbatim.
    private static readonly string[] NoHtmlSpecialTokens =
    {
        "<", ">", "*", "-", "?", ",", "/", ";", "\r\n",
    };

    转自:http://hi.baidu.com/squirrel_/blog/item/7c4c083b9b8384e714cecb7f.html

  • 相关阅读:
    黄聪: PHP WkHtmlToPdf/WkHtmlToImage 将网页直接转换成pdf和图片
    黄聪:PHP页面跳转如何实现延时跳转
    黄聪:wkhtmltopdf解决分页问题
    黄聪:wkhtmltopdf--高分辨率HTML转PDF
    黄聪:Wordpress二级域名共享用户cookie出现错误解决方案及WP的Cookie机制
    黄聪:wordpress向一个页面POST数据,出现404页面访问不了
    黄聪:PHP解决textarea内容换行存入数据库,如何解析取出不能自动换行
    黄聪:PHP7.0中htmlspecialchars出错解决方案(wordpress)
    黄聪:WordPress: 使用 wp_insert_attachment 上传附件
    黄聪: 50 个 Bootstrap 插件
  • 原文地址:https://www.cnblogs.com/dupeng0811/p/2383743.html
Copyright © 2011-2022 走看看