zoukankan
html css js c++ java
过滤HTML字符显示摘要
/// <summary>
/// Builds a plain-text summary of an HTML fragment, limited to a maximum length.
/// </summary>
/// <param name="html">HTML markup to summarise.</param>
/// <param name="summaryLength">Maximum number of characters of cleaned text to keep.</param>
/// <returns>
/// The cleaned text when it is no longer than <paramref name="summaryLength"/>;
/// otherwise its first <paramref name="summaryLength"/> characters followed by the suffix.
/// </returns>
public static string GetSummary(string html, int summaryLength)
{
    // Three cleaning passes, in the original order: strip tags, strip scripts/entities,
    // then the title clean-up helper.
    string text = GetHtmlText(html);
    text = DelHTML(text);

    // NOTE(review): Strtitle is not defined in the visible part of this file - confirm it exists
    // (it may have been intended to be DelWords).
    text = Strtitle(text);

    if (summaryLength >= text.Length)
    {
        return text;
    }

    // NOTE(review): the suffix literal was split across two lines in the published source and
    // contained only whitespace; it is restored here as a single space - confirm the intended suffix.
    return text.Substring(0, summaryLength) + " ";
}
/// <summary>
/// Removes every <c>&lt;...&gt;</c> tag from the given markup and returns the remaining text.
/// </summary>
/// <param name="html">HTML markup; may be null or empty.</param>
/// <returns>The input with all tags removed, or an empty string for null/empty input.</returns>
public static string GetHtmlText(string html)
{
    // Regex.Replace throws on null input; a missing document simply has no text.
    if (string.IsNullOrEmpty(html))
    {
        return string.Empty;
    }

    // The pattern must be a single-line literal: a verbatim string that spans lines would embed
    // line breaks in the regex and only match tags surrounded by newlines.
    return System.Text.RegularExpressions.Regex.Replace(html, @"<[^>]*>", "");
}
/// <summary>
/// Strips HTML from a string: removes script blocks, tags and comment markers, decodes a small
/// set of character entities, drops any other numeric entity, and finally removes every
/// remaining angle bracket and CRLF pair.
/// </summary>
/// <param name="Htmlstring">HTML markup; may be null or empty.</param>
/// <returns>
/// The trimmed plain text, or an empty string for null/empty input. The result is not
/// HTML-encoded (decoded characters such as <c>&amp;</c> and <c>"</c> are returned as-is).
/// </returns>
public static string DelHTML(string Htmlstring)
{
    // Regex.Replace throws on null input; treat missing markup as empty text.
    if (string.IsNullOrEmpty(Htmlstring))
    {
        return string.Empty;
    }

    const System.Text.RegularExpressions.RegexOptions ignoreCase =
        System.Text.RegularExpressions.RegexOptions.IgnoreCase;

    // Remove script blocks. Singleline lets '.' cross line breaks so that the body of a
    // multi-line script is removed together with its tags instead of leaking into the text.
    Htmlstring = System.Text.RegularExpressions.Regex.Replace(
        Htmlstring,
        @"<script[^>]*?>.*?</script>",
        "",
        ignoreCase | System.Text.RegularExpressions.RegexOptions.Singleline);

    // Remove tags, newline-led whitespace runs and comment markers, in this order.
    string[] removalPatterns =
    {
        @"<(.[^>]*)>",
        @"([\r\n])[\s]+",
        @"-->",
        @"<!--.*",
    };
    foreach (string pattern in removalPatterns)
    {
        Htmlstring = System.Text.RegularExpressions.Regex.Replace(Htmlstring, pattern, "", ignoreCase);
    }

    // Decode the supported entities; order matters (e.g. "&amp;lt;" becomes "&lt;" and then "<").
    // The last entry drops every numeric entity that was not decoded above.
    string[,] entityReplacements =
    {
        { @"&(quot|#34);", "\"" },
        { @"&(amp|#38);", "&" },
        { @"&(lt|#60);", "<" },
        { @"&(gt|#62);", ">" },
        { @"&(nbsp|#160);", " " },
        { @"&(iexcl|#161);", "\u00A1" },
        { @"&(cent|#162);", "\u00A2" },
        { @"&(pound|#163);", "\u00A3" },
        { @"&(copy|#169);", "\u00A9" },
        { @"&#(\d+);", "" },
    };
    for (int i = 0; i < entityReplacements.GetLength(0); i++)
    {
        Htmlstring = System.Text.RegularExpressions.Regex.Replace(
            Htmlstring,
            entityReplacements[i, 0],
            entityReplacements[i, 1],
            ignoreCase);
    }

    // string.Replace returns a new string, so the result must be assigned. Without the
    // assignment, entity-encoded markup such as "&lt;script&gt;" would be returned as live
    // "<script>" markup.
    Htmlstring = Htmlstring.Replace("<", "");
    Htmlstring = Htmlstring.Replace(">", "");
    Htmlstring = Htmlstring.Replace("\r\n", "");

    return Htmlstring.Trim();
}
/// <summary>
/// Removes a fixed set of upper-case formatting tags (H1, SPAN, FONT, IMG, P, BR, Office
/// <c>o:p</c> markers and the Office XML namespace declaration) from a title string.
/// Matching is case-sensitive, as in the original patterns.
/// </summary>
/// <param name="strtitle">Title markup; may be null or empty.</param>
/// <returns>The cleaned title, or an empty string for null/empty input.</returns>
public static string DelWords(string strtitle)
{
    // Regex.Replace throws on null input; a missing title has nothing to clean.
    if (string.IsNullOrEmpty(strtitle))
    {
        return string.Empty;
    }

    // The published pattern had an empty alternative ("<FONT.*?>||<o:p>...") which matches
    // nothing useful; "</FONT>" completes the open/close pairs used for H1 and SPAN.
    string strContent = System.Text.RegularExpressions.Regex.Replace(
        strtitle,
        "(<H1.*?>|</H1>|</br>|<SPAN.*?>|</SPAN>|<FONT.*?>|</FONT>|<o:p></o:p>)",
        "");

    // Applied one after another, in the original order.
    string[] removalPatterns =
    {
        "(<IMG.*?>)",
        "(<P.*?>)",
        "(<P>)",
        // NOTE(review): as published this removes a space character; the pattern may originally
        // have been an HTML entity (e.g. a non-breaking space) lost in publishing - confirm.
        "( )",
        // Right double quotation mark (U+201D).
        "(\u201D)",
        "(</P>)",
        "(</BR>)",
        "(<BR>)",
    };
    foreach (string pattern in removalPatterns)
    {
        strContent = System.Text.RegularExpressions.Regex.Replace(strContent, pattern, "");
    }

    strContent = strContent.Replace(
        "<?xml:namespace prefix = o ns = 'urn:schemas-microsoft-com:office:office'/>",
        "");

    // Return the fully cleaned text; returning the parameter here would discard every
    // replacement after the first one.
    return strContent;
}
查看全文
相关阅读:
AESUtil_1
ELK配置
Centos7上安装docker
Excel大批量数据导出
Redis5.0.6安装完整步骤
idea远程打断点
[HNOI2016] 序列
[TJOI2017] 异或和
洛谷 P4933 大师
洛谷 P1950 长方形_NOI导刊2009提高(2)
原文地址:https://www.cnblogs.com/cnaspnet/p/1216790.html
最新文章
JavaScript中this关键字的使用比较
使用Ant和YUICompressor链接合并压缩你的JS和CSS代码
IE6+以上清除浮动普遍方法总结
使用display:table使两栏布局高度相等
自己写的JS排序算法
JS一个根据时区输出时区时间的函数
C语言,C#,Java,JavaScript之强类型与弱类型
LBP特征处理(一)
C++中的移位运算
VS2015——opencv3.4.2扩展库安装
热门文章
HOG特征基础(一)
SURF特征点检测实现
SURF特征点检测原理
亚像素角点检测
SIFT特征点检测实现
SIFT特征点提取
在Docker内安装jenkins运行和基础配置
RSA公钥加密-私钥解密/私钥加密-公钥解密
DESUtil
AESUtil
Copyright © 2011-2022 走看看