zoukankan      html  css  js  c++  java
  • ASP.NET 去除所有HTML标记的方法

    using System.Net;
    using System.Text.RegularExpressions;
    
    /// <summary>
    /// Strips HTML markup from a string and returns the remaining text, HTML-encoded.
    /// </summary>
    /// <remarks>
    /// Steps, in order: remove script elements (including their bodies), remove all
    /// remaining tags, remove line breaks together with the whitespace that follows
    /// them, remove comment remnants, decode a small fixed set of entities (all other
    /// numeric entities are dropped), drop stray angle brackets, then HTML-encode and
    /// trim the result.
    /// </remarks>
    /// <param name="Htmlstring">Source text that may contain HTML. May be null.</param>
    /// <returns>
    /// The encoded, trimmed text, or an empty string when the input is null or empty.
    /// </returns>
    public static string NoHTML(string Htmlstring)
    {
        if (string.IsNullOrEmpty(Htmlstring))
        {
            return string.Empty;
        }

        // Remove script elements. Singleline lets '.' cross line breaks so that
        // multi-line script bodies are removed along with their tags.
        Htmlstring = Regex.Replace(Htmlstring, @"<script[^>]*?>.*?</script>", "",
            RegexOptions.IgnoreCase | RegexOptions.Singleline);

        // Remove every remaining tag.
        Htmlstring = Regex.Replace(Htmlstring, @"<(.[^>]*)>", "", RegexOptions.IgnoreCase);

        // Remove each line break together with the whitespace run that follows it.
        Htmlstring = Regex.Replace(Htmlstring, @"([\r\n])[\s]+", "", RegexOptions.IgnoreCase);

        // Remove what is left of comments: orphaned terminators, then unterminated openers.
        Htmlstring = Regex.Replace(Htmlstring, @"-->", "", RegexOptions.IgnoreCase);
        Htmlstring = Regex.Replace(Htmlstring, @"<!--.*", "", RegexOptions.IgnoreCase);

        // Decode entities in a single pass so that already-decoded output is never
        // decoded a second time (e.g. "&amp;lt;" must become "&lt;", not "<").
        Htmlstring = Regex.Replace(Htmlstring,
            @"&(quot|amp|lt|gt|nbsp|iexcl|cent|pound|copy|#\d+);",
            DecodeKnownEntity, RegexOptions.IgnoreCase);

        // string.Replace returns a new string; the result must be assigned to take effect.
        Htmlstring = Htmlstring.Replace("<", "").Replace(">", "").Replace("\r\n", "");

        // WebUtility does not need an active HttpContext, so this also works outside a request.
        return WebUtility.HtmlEncode(Htmlstring).Trim();
    }

    // Maps one matched entity (name or decimal code, without '&' and ';') to its
    // replacement text; numeric entities that are not listed are dropped.
    private static string DecodeKnownEntity(Match entity)
    {
        switch (entity.Groups[1].Value.ToLowerInvariant())
        {
            case "quot":
            case "#34":
                return "\"";
            case "amp":
            case "#38":
                return "&";
            case "lt":
            case "#60":
                return "<";
            case "gt":
            case "#62":
                return ">";
            case "nbsp":
            case "#160":
                return "   ";
            case "iexcl":
            case "#161":
                return "\u00A1";
            case "cent":
            case "#162":
                return "\u00A2";
            case "pound":
            case "#163":
                return "\u00A3";
            case "copy":
            case "#169":
                return "\u00A9";
            default:
                return string.Empty;
        }
    }
    
     
    
    写一个静态方法   
      #region Remove HTML tags
      /// <summary>
      /// Removes every HTML tag from the given text.
      /// </summary>
      /// <param name="HTMLStr">Text that may contain HTML tags.</param>
      /// <returns>
      /// The input with each span from a '&lt;' through the next '&gt;' removed.
      /// </returns>
      public static string ParseTags(string HTMLStr)
      {
          // A tag is '<', any run of characters other than '>', then '>'.
          const string tagPattern = "<[^>]*>";
          var tagMatcher = new System.Text.RegularExpressions.Regex(tagPattern);
          return tagMatcher.Replace(HTMLStr, string.Empty);
      }

      #endregion
        
                      #region Extract the image URL from text
                      // Matches the src attribute of an <img> tag. The value may be double-quoted,
                      // single-quoted or unquoted; the surrounding quotes are not captured.
                      // Built once and reused, because compiling the pattern on every call is wasteful.
                      private static readonly Regex ImgSrcRegex = new Regex(
                          @"<img\s+(?:[^>]*?\s)?src\s*=\s*(?:""(?<url>[^""]*)""|'(?<url>[^']*)'|(?<url>[^\s>]+))",
                          RegexOptions.IgnoreCase | RegexOptions.Compiled);

                      /// <summary>
                      /// Returns the src value of the first &lt;img&gt; tag found in the text.
                      /// </summary>
                      /// <param name="HTMLStr">Text that may contain an image tag. May be null.</param>
                      /// <returns>
                      /// The URL exactly as written in the source (original casing, no quotes),
                      /// or an empty string when the input is null or empty or no image tag
                      /// with a src attribute is found.
                      /// </returns>
                      public static string GetImgUrl(string HTMLStr)
                      {
                          if (string.IsNullOrEmpty(HTMLStr))
                          {
                              return string.Empty;
                          }

                          // Match case-insensitively instead of lowercasing the input:
                          // URL paths can be case-sensitive and must be returned unchanged.
                          Match m = ImgSrcRegex.Match(HTMLStr);
                          return m.Success ? m.Groups["url"].Value : string.Empty;
                      }

                      #endregion
    

      

  • 相关阅读:
    ASP.NET Core新书终于上市,完成今年一个目标,赠书活动
    .NET 5.0 RC2 发布,正式版即将在 11 月 .NET Conf 大会上发布
    .NET Standard 来日苦短去日长
    [C#.NET 拾遗补漏]09:数据标注与数据校验
    几个超级实用但很少人知道的 VS 技巧[更新]
    .NET 5 中 Target Framework 详解
    .NET 5.0 RC1 发布,离正式版发布仅剩两个版本
    Git 实用操作:撤销 Commit 提交(动图讲解)
    Git 实用操作:重写 Commit 历史
    [C#.NET 拾遗补漏]08:强大的LINQ
  • 原文地址:https://www.cnblogs.com/suzh/p/3433825.html
Copyright © 2011-2022 走看看