C#去除指定字符串中的HTML标签相关代码函数
2008-05-21 11:50
881 查看
/// <summary>
/// Removes the markup of one HTML tag from a string using regular expressions.
/// Matching is case-insensitive and every occurrence is removed, regardless of
/// the attributes or letter casing of the individual tags.
/// </summary>
/// <param name="strContent">
/// Text to clean. A null or empty value is returned unchanged.
/// </param>
/// <param name="strTagName">
/// Name of the tag to remove, e.g. "a". The value is inserted into the regular
/// expression as-is (it is NOT escaped), so a fragment such as "h[1-6]" is
/// honoured and an invalid fragment makes the Regex class throw. A null or
/// empty name matches every tag.
/// </param>
/// <param name="strType">
/// 1: remove the opening tags only (&lt;a ...&gt;) and keep everything after them;
/// 2: remove opening and closing tags but keep the text between them;
/// 3: remove opening tag, closing tag and everything between them.
/// Any other value returns <paramref name="strContent"/> unchanged.
/// </param>
/// <returns>The content with the requested markup removed.</returns>
/// <remarks>
/// This is a regex-based clean-up helper, not an HTML parser: nested elements
/// of the same tag and malformed markup are not handled specially.
/// </remarks>
private static string RemoveHtml(string strContent, string strTagName, int strType)
{
    if (string.IsNullOrEmpty(strContent))
    {
        return strContent;
    }

    bool anyTag = string.IsNullOrEmpty(strTagName);

    // Group the name so that an alternation passed by the caller stays confined to the name.
    string name = "(?:" + strTagName + ")";

    // The look-ahead ends the tag name, so "a" does not also match <abbr> or <address>.
    // It is skipped for an empty name, which keeps the "match every tag" behaviour.
    string openTag = "<" + name + (anyTag ? "" : @"(?=[\s/>])") + "[^>]*>";
    string closeTag = "</" + name + (anyTag ? "" : @"(?=[\s>])") + "[^>]*>";

    // Singleline lets '.' match line breaks, so mode 3 also removes elements spanning several lines.
    RegexOptions options = RegexOptions.IgnoreCase | RegexOptions.Singleline;

    switch (strType)
    {
        case 1:
            return Regex.Replace(strContent, openTag, "", options);

        case 2:
            // Opening tags first, then closing tags, in the same order as the original code.
            string withoutOpenTags = Regex.Replace(strContent, openTag, "", options);
            return Regex.Replace(withoutOpenTags, closeTag, "", options);

        case 3:
            // Lazy quantifier: stop at the nearest closing tag instead of the last one.
            return Regex.Replace(strContent, openTag + ".*?" + closeTag, "", options);

        default:
            return strContent;
    }
}
/// <summary>
/// Removes the markup of one HTML tag from a string using regular expressions.
/// Matching is case-insensitive and every occurrence is removed, regardless of
/// the attributes or letter casing of the individual tags.
/// </summary>
/// <param name="strContent">
/// Text to clean. A null or empty value is returned unchanged.
/// </param>
/// <param name="strTagName">
/// Name of the tag to remove, e.g. "a". The value is inserted into the regular
/// expression as-is (it is NOT escaped), so a fragment such as "h[1-6]" is
/// honoured and an invalid fragment makes the Regex class throw. A null or
/// empty name matches every tag.
/// </param>
/// <param name="strType">
/// 1: remove the opening tags only (&lt;a ...&gt;) and keep everything after them;
/// 2: remove opening and closing tags but keep the text between them;
/// 3: remove opening tag, closing tag and everything between them.
/// Any other value returns <paramref name="strContent"/> unchanged.
/// </param>
/// <returns>The content with the requested markup removed.</returns>
/// <remarks>
/// This is a regex-based clean-up helper, not an HTML parser: nested elements
/// of the same tag and malformed markup are not handled specially.
/// </remarks>
private static string RemoveHtml(string strContent, string strTagName, int strType)
{
    if (string.IsNullOrEmpty(strContent))
    {
        return strContent;
    }

    bool anyTag = string.IsNullOrEmpty(strTagName);

    // Group the name so that an alternation passed by the caller stays confined to the name.
    string name = "(?:" + strTagName + ")";

    // The look-ahead ends the tag name, so "a" does not also match <abbr> or <address>.
    // It is skipped for an empty name, which keeps the "match every tag" behaviour.
    string openTag = "<" + name + (anyTag ? "" : @"(?=[\s/>])") + "[^>]*>";
    string closeTag = "</" + name + (anyTag ? "" : @"(?=[\s>])") + "[^>]*>";

    // Singleline lets '.' match line breaks, so mode 3 also removes elements spanning several lines.
    RegexOptions options = RegexOptions.IgnoreCase | RegexOptions.Singleline;

    switch (strType)
    {
        case 1:
            return Regex.Replace(strContent, openTag, "", options);

        case 2:
            // Opening tags first, then closing tags, in the same order as the original code.
            string withoutOpenTags = Regex.Replace(strContent, openTag, "", options);
            return Regex.Replace(withoutOpenTags, closeTag, "", options);

        case 3:
            // Lazy quantifier: stop at the nearest closing tag instead of the last one.
            return Regex.Replace(strContent, openTag + ".*?" + closeTag, "", options);

        default:
            return strContent;
    }
}
相关文章推荐
- C#去除指定字符串中的HTML标签相关代码函数
- C#去除指定字符串中的HTML标签相关代码函数
- C#去除指定字符串中的HTML标签
- C#去除指定字符串中的HTML标签
- 用C#去除字符串中HTML的格式(清除数据库中html标签)
- AJ学IOS之去除服务器返回数据中的html标签,去除指定字符串,替换字符串
- 帝国 标签模板 使用程序代码 去除html标记 并 截取字符串
- PHP中strip_tags() 函数的使用方法和介绍,去除字符串中的HTML标签等
- C#使用正则表达式获取HTML代码中a标签里包含指定后缀的href的值
- 猫猫学iOS之去除服务器返回数据中的html标签,去除指定字符串,替换字符串
- C# 去所有 html标签的代码|去除html标签代码
- C# 去所有 html标签的代码|去除html标签代码
- 去除指定字符串中的HTML标签
- 用C#去除字符串中HTML的格式(清除数据库中html标签)
- C#去除一段字符串内的HTML标签,正则表达式
- ASP.NET去除HTML标签并截取指定长度字符串
- C#去除字符串中的html标签
- C#去除HTML标签
- php下清空字符串中的HTML标签的代码
- C#抓取网页数据、分析并且去除HTML标签