ASP.NET 中如何去掉字符串中的所有 HTML 代码，将其转换为纯文本
2012-02-28 14:07
756 查看
/// <summary>
/// Removes a fixed list of HTML tags, character entities and script-related
/// tokens from <paramref name="HtmlStr"/> and returns what is left.
/// </summary>
/// <param name="HtmlStr">Markup to clean. Null or empty input is returned unchanged.</param>
/// <returns>
/// The input with every match of the patterns below removed. Matching is
/// case-insensitive and the patterns are applied in the listed order.
/// </returns>
/// <remarks>
/// Only the tags themselves are removed; text between an opening and a closing
/// tag (for example the body of a script element) is kept.
/// The tag patterns have no word boundary after the tag name, so a pattern such
/// as <c>&lt;/?p[^&gt;]*&gt;</c> also removes any other tag whose name starts
/// with the same letters.
/// The <c>javascript:</c> and <c>on(mouse|...)</c> patterns match anywhere in
/// the string, including ordinary text.
/// </remarks>
public string ClearHtml(string HtmlStr)
{
    if (string.IsNullOrEmpty(HtmlStr))
    {
        return HtmlStr;
    }

    string[] patterns =
    {
        // Numeric character references only (&#160; / &#xA0;). The previous
        // pattern "[^>]*;" erased all plain text that preceded a semicolon.
        "&#x?[0-9a-f]+;",
        "</?marquee[^>]*>",
        "</?object[^>]*>",
        "</?param[^>]*>",
        "</?embed[^>]*>",
        "</?table[^>]*>",
        // Non-breaking space, as an entity or as the decoded character. The
        // previous pattern was a bare blank, which risks stripping every
        // space from the text.
        "&nbsp;|\u00A0",
        "</?tr[^>]*>",
        "</?th[^>]*>",
        "</?p[^>]*>",
        "</?a[^>]*>",
        "</?img[^>]*>",
        "</?tbody[^>]*>",
        "</?li[^>]*>",
        "</?span[^>]*>",
        "</?div[^>]*>",
        "</?td[^>]*>",
        "</?script[^>]*>",
        "(javascript|jscript|vbscript|vbs):",
        "on(mouse|exit|error|click|key)",
        "<\\?xml[^>]*>",
        "<\\/?[a-z]+:[^>]*>",
        "</?font[^>]*>",
        "</?b[^>]*>",
        "</?u[^>]*>",
        "</?i[^>]*>",
        "</?strong[^>]*>"
    };

    string text = HtmlStr;
    foreach (string pattern in patterns)
    {
        text = System.Text.RegularExpressions.Regex.Replace(
            text,
            pattern,
            "",
            System.Text.RegularExpressions.RegexOptions.IgnoreCase);
    }

    return text;
}
/// <summary>
/// Replaces every case-insensitive match of a regular expression in a string.
/// </summary>
/// <param name="Pattern">Regular expression to search for.</param>
/// <param name="HtmlStr">Text to search.</param>
/// <param name="replacement">Replacement pattern substituted for each match.</param>
/// <returns>
/// <paramref name="HtmlStr"/> with all matches replaced, or the input itself
/// when nothing matches.
/// </returns>
public string ReplaceHtml(string Pattern, string HtmlStr, string replacement)
{
    System.Text.RegularExpressions.Regex matcher = new System.Text.RegularExpressions.Regex(
        Pattern,
        System.Text.RegularExpressions.RegexOptions.IgnoreCase);

    // Regex.Replace hands the input back unchanged when there is no match,
    // so a separate IsMatch probe is not needed.
    return matcher.Replace(HtmlStr, replacement);
}
/// <summary>
/// Removes a fixed list of HTML tags, character entities and script-related
/// tokens from <paramref name="HtmlStr"/> and returns what is left.
/// </summary>
/// <param name="HtmlStr">Markup to clean. Null or empty input is returned unchanged.</param>
/// <returns>
/// The input with every match of the patterns below removed. Matching is
/// case-insensitive and the patterns are applied in the listed order.
/// </returns>
/// <remarks>
/// Only the tags themselves are removed; text between an opening and a closing
/// tag is kept. The tag patterns have no word boundary after the tag name, so
/// a pattern such as <c>&lt;/?b[^&gt;]*&gt;</c> also removes any other tag whose
/// name starts with the same letters.
/// </remarks>
// NOTE(review): the signature line was missing from this copy of the listing;
// it is restored here from the HtmlStr parameter the body reads.
public string ClearHtml(string HtmlStr)
{
    if (string.IsNullOrEmpty(HtmlStr))
    {
        return HtmlStr;
    }

    string[] patterns =
    {
        // Numeric character references only (&#160; / &#xA0;). The previous
        // pattern "[^>]*;" erased all plain text that preceded a semicolon.
        "&#x?[0-9a-f]+;",
        "</?marquee[^>]*>",
        "</?object[^>]*>",
        "</?param[^>]*>",
        "</?embed[^>]*>",
        "</?table[^>]*>",
        // Non-breaking space, as an entity or as the decoded character. The
        // previous pattern was a bare blank, which risks stripping every
        // space from the text.
        "&nbsp;|\u00A0",
        "</?tr[^>]*>",
        "</?th[^>]*>",
        "</?p[^>]*>",
        "</?a[^>]*>",
        "</?img[^>]*>",
        "</?tbody[^>]*>",
        "</?li[^>]*>",
        "</?span[^>]*>",
        "</?div[^>]*>",
        "</?td[^>]*>",
        "</?script[^>]*>",
        "(javascript|jscript|vbscript|vbs):",
        "on(mouse|exit|error|click|key)",
        "<\\?xml[^>]*>",
        "<\\/?[a-z]+:[^>]*>",
        "</?font[^>]*>",
        "</?b[^>]*>",
        "</?u[^>]*>",
        "</?i[^>]*>",
        "</?strong[^>]*>"
    };

    string text = HtmlStr;
    foreach (string pattern in patterns)
    {
        text = System.Text.RegularExpressions.Regex.Replace(
            text,
            pattern,
            "",
            System.Text.RegularExpressions.RegexOptions.IgnoreCase);
    }

    return text;
}
/// <summary>
/// Runs a case-insensitive regular-expression replacement over a string.
/// </summary>
/// <param name="Pattern">Regular expression to search for.</param>
/// <param name="HtmlStr">Text to search.</param>
/// <param name="replacement">Replacement pattern substituted for each match.</param>
/// <returns>
/// The text with all matches replaced; <paramref name="HtmlStr"/> itself when
/// the pattern does not occur.
/// </returns>
public string ReplaceHtml(string Pattern, string HtmlStr, string replacement)
{
    System.Text.RegularExpressions.RegexOptions options =
        System.Text.RegularExpressions.RegexOptions.IgnoreCase;
    System.Text.RegularExpressions.Regex expression =
        new System.Text.RegularExpressions.Regex(Pattern, options);

    // Only rewrite the string when the pattern actually occurs in it.
    return expression.IsMatch(HtmlStr)
        ? expression.Replace(HtmlStr, replacement)
        : HtmlStr;
}
相关文章推荐
- 关于asp.net(c#),webconfig中如何定义一个字符串让所有页面共同使用?
- Asp.Net中的字符串和HTML十进制编码转换实现代码
- asp.net中利用正则表达式判断一个字符串是否为数字的代码
- ASP.NET MVC @Html.DropDownList()如何去掉空白项
- asp.net如何去掉HTML标记
- 去掉asp.net自动生成的垃圾代码的一个类
- asp.net如何去掉HTML标记
- asp.net如何去掉HTML标记
- 去掉asp.net自动生成的垃圾代码的一个类
- Asp.net MVC 如何对所有用户输入的字符串字段做Trim处理
- 请问我如何在一个webBrowser控件中加载一个 html格式的字符串 - _NET技术 - C#
- Asp.net中如何过滤html,js,css代码
- Asp.net中如何过滤html,js,css代码
- [VB.NET]VB.NET中如何向网页提交一个请求,并得到返回的HTML代码?
- Asp.net中如何过滤html,js,css代码
- asp.net如何去掉HTML标记
- Asp.net中如何过滤html,js,css代码
- 在Asp.net中如何遍历一个本地目录下的所有文件并上载到Web 服务器上指定的目录中
- asp.net去掉HTML标记代码
- asp.net中利用正则表达式判断一个字符串是否为数字的代码