zoukankan      html  css  js  c++  java
  • 去除html

     /// <summary>
            /// Strips HTML markup from a string and returns the remaining text.
            /// </summary>
            /// <remarks>
            /// Processing order:
            /// 1. script elements are removed together with their content;
            /// 2. a small set of character entities is decoded (or dropped);
            /// 3. anything that looks like a tag is removed;
            /// 4. comment remnants, indentation after line breaks, CR/LF pairs and any
            ///    leftover angle brackets are removed.
            /// Entities are decoded before tags are stripped, so entity-encoded markup
            /// is stripped as well. The result is NOT HTML-encoded; encode it again
            /// before writing it into an HTML page.
            /// </remarks>
            /// <param name="Htmlstring">The HTML fragment to clean. May be null or empty.</param>
            /// <returns>
            /// The text with markup removed, or an empty string when
            /// <paramref name="Htmlstring"/> is null or empty.
            /// </returns>
            public static string DelHTML(string Htmlstring)
            {
                // Regex.Replace throws on null input; treat "nothing to clean" as empty text.
                if (string.IsNullOrEmpty(Htmlstring))
                {
                    return string.Empty;
                }

                const System.Text.RegularExpressions.RegexOptions ignoreCase =
                    System.Text.RegularExpressions.RegexOptions.IgnoreCase;

                // Remove script elements. Singleline lets '.' match line breaks, so scripts
                // that span several lines are removed too instead of leaking their body.
                Htmlstring = System.Text.RegularExpressions.Regex.Replace(
                    Htmlstring,
                    @"<script[^>]*?>.*?</script>",
                    "",
                    ignoreCase | System.Text.RegularExpressions.RegexOptions.Singleline);

                // Ordered { pattern, replacement } pairs; the order is significant.
                string[][] rewrites =
                {
                    // Character entities.
                    new[] { @"&(quot|#34);", "" },          // double quotes are dropped, not decoded
                    new[] { @"&(amp|#38);", "&" },
                    new[] { @"&(lt|#60);", "<" },
                    new[] { @"&(gt|#62);", ">" },
                    new[] { @"&(nbsp|#160);", " " },
                    new[] { @"&(iexcl|#161);", "\u00A1" },  // inverted exclamation mark
                    new[] { @"&(cent|#162);", "\u00A2" },   // cent sign
                    new[] { @"&(pound|#163);", "\u00A3" },  // pound sign
                    new[] { @"&(copy|#169);", "\u00A9" },   // copyright sign
                    new[] { @"&#(\d+);", "" },              // any other numeric entity is dropped

                    // Markup.
                    new[] { @"<(.[^>]*)>", "" },            // anything shaped like a tag
                    new[] { @"([\r\n])[\s]+", "" },         // a line break plus the whitespace after it
                    new[] { @"-->", "" },                   // stray comment terminator
                    new[] { @"<!--.*", "" },                // unterminated comment, up to end of line
                };

                foreach (string[] rewrite in rewrites)
                {
                    Htmlstring = System.Text.RegularExpressions.Regex.Replace(
                        Htmlstring, rewrite[0], rewrite[1], ignoreCase);
                }

                // string.Replace returns a new string; the result must be assigned back.
                Htmlstring = Htmlstring.Replace("<", "");
                Htmlstring = Htmlstring.Replace(">", "");
                Htmlstring = Htmlstring.Replace("\r\n", "");

                return Htmlstring;
            }
  • 相关阅读:
    Python之美[从菜鸟到高手]--Python垃圾回收机制及gc模块详解
    linux-memory-buffer-vs-cache
    MYSQL----myownstars(102)
    win10系统调用架构分析
    on io scheduling again
    Java并发编程
    elixir-lang
    mydumper工作原理, seconds_behind_master的陷阱和pt-heartbeat (102)
    深入理解JavaScript系列+ 深入理解javascript之执行上下文
    我们应该如何去了解JavaScript引擎的工作原理 系列
  • 原文地址:https://www.cnblogs.com/mengxingxinqing/p/3164910.html
Copyright © 2011-2022 走看看