zoukankan
html css js c++ java
过滤HTML字符显示摘要
/// <summary>
/// Builds a plain-text summary of an HTML fragment, truncated to at most
/// <paramref name="summaryLength"/> characters.
/// </summary>
/// <param name="html">HTML source to summarise. A null value yields an empty string.</param>
/// <param name="summaryLength">Maximum number of text characters to keep; must not be negative.</param>
/// <returns>
/// The cleaned text when it already fits; otherwise its first
/// <paramref name="summaryLength"/> characters followed by the trailing marker string.
/// </returns>
/// <exception cref="System.ArgumentOutOfRangeException">
/// <paramref name="summaryLength"/> is negative.
/// </exception>
public static string GetSummary(string html, int summaryLength)
{
    // Fail fast with a named parameter instead of letting Substring throw the
    // same exception type after all the cleaning work has been done.
    if (summaryLength < 0)
    {
        throw new System.ArgumentOutOfRangeException(
            "summaryLength", "summaryLength must not be negative.");
    }

    if (html == null)
    {
        return string.Empty;
    }

    // DelHTML has to see the raw markup. Stripping tags first (as the previous
    // GetHtmlText call did) removed the <script> delimiters, so DelHTML could no
    // longer find script blocks and their source text leaked into the summary.
    // DelHTML removes the remaining tags itself.
    string text = DelHTML(html);

    // Strtitle is defined outside this excerpt; its result is used as-is.
    text = Strtitle(text);

    if (summaryLength >= text.Length)
    {
        return text;
    }

    // NOTE(review): the trailing marker reads as a single space in this copy of
    // the source; confirm it was not meant to be an ellipsis.
    return text.Substring(0, summaryLength) + " ";
}
/// <summary>
/// Removes every tag-shaped span (a '&lt;', any run of characters other than
/// '&gt;', then a '&gt;') from the given text.
/// </summary>
/// <param name="html">Text that may contain HTML tags.</param>
/// <returns>The input with all such spans deleted.</returns>
public static string GetHtmlText(string html)
{
    System.Text.RegularExpressions.Regex tagPattern =
        new System.Text.RegularExpressions.Regex(@"<[^>]*>");

    string withoutTags = tagPattern.Replace(html, "");
    return withoutTags;
}
/// <summary>
/// Strips HTML from a string: removes script blocks, tags and comment
/// remnants, decodes a small fixed set of character entities, drops any other
/// numeric entity, and finally removes stray angle brackets and CRLF pairs.
/// </summary>
/// <param name="Htmlstring">Text that may contain HTML. Null or empty yields an empty string.</param>
/// <returns>The cleaned text with leading and trailing whitespace trimmed.</returns>
public static string DelHTML(string Htmlstring)
{
    if (string.IsNullOrEmpty(Htmlstring))
    {
        return string.Empty;
    }

    const System.Text.RegularExpressions.RegexOptions ignoreCase =
        System.Text.RegularExpressions.RegexOptions.IgnoreCase;

    // Remove script blocks. Singleline lets '.' match newlines, so scripts that
    // span several lines are removed as well (previously only one-line scripts
    // matched and multi-line script source was left in the output).
    Htmlstring = System.Text.RegularExpressions.Regex.Replace(
        Htmlstring,
        @"<script[^>]*?>.*?</script>",
        "",
        ignoreCase | System.Text.RegularExpressions.RegexOptions.Singleline);

    // Pattern / replacement pairs, applied in this exact order.
    string[,] rules =
    {
        { @"<(.[^>]*)>", "" },          // remaining HTML tags
        { @"([\r\n])[\s]+", "" },       // a line break followed by whitespace
        { @"-->", "" },                 // comment terminator left behind
        { @"<!--.*", "" },              // comment opener through end of line
        { @"&(quot|#34);", "\"" },
        { @"&(amp|#38);", "&" },
        { @"&(lt|#60);", "<" },
        { @"&(gt|#62);", ">" },
        { @"&(nbsp|#160);", " " },
        { @"&(iexcl|#161);", "\xa1" },
        { @"&(cent|#162);", "\xa2" },
        { @"&(pound|#163);", "\xa3" },
        { @"&(copy|#169);", "\xa9" },
        { @"&#(\d+);", "" }             // any other numeric entity is dropped
    };

    for (int i = 0; i < rules.GetLength(0); i++)
    {
        Htmlstring = System.Text.RegularExpressions.Regex.Replace(
            Htmlstring, rules[i, 0], rules[i, 1], ignoreCase);
    }

    // String.Replace returns a new string; the results were previously thrown
    // away, so entity-encoded markup such as "&lt;script&gt;" came out of this
    // method as live "<script>". Assigning the results removes the brackets.
    Htmlstring = Htmlstring.Replace("<", "");
    Htmlstring = Htmlstring.Replace(">", "");
    Htmlstring = Htmlstring.Replace("\r\n", "");

    return Htmlstring.Trim();
}
/// <summary>
/// Removes a fixed list of upper-case, Word-style HTML tags and a few stray
/// characters from a piece of text.
/// </summary>
/// <param name="strtitle">Text to clean. Null or empty yields an empty string.</param>
/// <returns>The text with every listed pattern removed.</returns>
public static string DelWords(string strtitle)
{
    if (string.IsNullOrEmpty(strtitle))
    {
        return string.Empty;
    }

    // Remove the Office namespace declaration first, while the literal is still
    // intact; the single-character rule further down could otherwise alter it
    // before this exact-match replacement runs.
    string strContent = strtitle.Replace(
        "<?xml:namespace prefix = o ns = 'urn:schemas-microsoft-com:office:office'/>",
        "");

    // The original pattern contained an empty alternative ("||"). Alternation is
    // tried left to right, so the empty branch always matched before
    // "<o:p></o:p>" and that tag was never removed. The empty branch is replaced
    // by the closing FONT tag, which pairs with the "<FONT.*?>" opener.
    strContent = Regex.Replace(
        strContent,
        "(<H1.*?>|</H1>|</br>|<SPAN.*?>|</SPAN>|<FONT.*?>|</FONT>|<o:p></o:p>)",
        "");

    // "(<P>)" from the original list is omitted: "(<P.*?>)" already matches it.
    // NOTE(review): "( )" is copied as it appears in this copy of the source; it
    // may originally have been a non-breaking space or "&nbsp;" - confirm.
    string[] patterns =
    {
        "(<IMG.*?>)",
        "(<P.*?>)",
        "( )",
        "(”)",
        "(</P>)",
        "(</BR>)",
        "(<BR>)"
    };

    foreach (string pattern in patterns)
    {
        strContent = Regex.Replace(strContent, pattern, "");
    }

    // Return the fully cleaned text. The original returned strtitle, which only
    // held the result of the first replacement and discarded all later ones.
    return strContent;
}
查看全文
相关阅读:
Java 执行
Java 反射
Mysql 日常
Java 引用
Mysql insert on update
Java Mail 异常
HDU_5456_数位dp
HDU_4734_数位dp
POJ_1221_DP
POJ_1050_最大子矩阵
原文地址:https://www.cnblogs.com/cnaspnet/p/1216790.html
最新文章
【题解】[CSP-S 2020] 儒略日【大模拟】
【题解】[codeforces 617E] XOR and Favorite Number【莫队】
扩展Lucas定理 学习笔记
Lucas定理 学习笔记
【洛谷P4774】 [NOI2018] 屠龙勇士【exCRT】
中国剩余定理/扩展中国剩余定理 学习笔记
必须Mark!43个优秀的Swift开源项目推荐
Swift中的HTTP请求
mysql将字符转换成数字
Android中使用WebView, WebChromeClient和WebViewClient加载网页 (能够执行js)
热门文章
android中两种方式打开网页
Android:控件WebView显示网页
JAVA除法保留小数点后两位的两种方法 Java Math的 floor,round和ceil的总结
FileMode文件模式
C#读写txt文件的两种方法介绍
C#判断文件及文件夹是否存在并创建(C#判断文件夹存在)
Hive 问题
Spring中获取request的几种方法,及其线程安全性分析
Java 包扫描器
Shell 日常 ip 端口可用性测试
Copyright © 2011-2022 走看看