关键字加链接
// Matches every non-word-boundary position (\B); GetPattern replaces those positions
// inside a block word with a short "gap" sub-pattern.
private static readonly Regex reg_b = new Regex(@"\B", RegexOptions.Compiled);
// Matches a run of one or more ASCII letters anywhere in the input (not anchored).
private static readonly Regex reg_en = new Regex(@"[a-zA-Z]+", RegexOptions.Compiled);
// Matches input that consists solely of '-', '.', whitespace and digits.
private static readonly Regex reg_num = new Regex(@"^[\-\.\s\d]+$", RegexOptions.Compiled);
// Combined regex covering all blocked words; stays null until GetRegex() builds it.
private static Regex reg_word = null; // combined regex of all blocked words
/// <summary>
/// Returns the combined blocked-word regex, creating and caching it in
/// <c>reg_word</c> on the first call.
/// </summary>
/// <returns>The cached, compiled, case-insensitive regex built from GetPattern().</returns>
private static Regex GetRegex()
{
    // Fast path: already built by an earlier call.
    if (reg_word != null)
    {
        return reg_word;
    }

    string pattern = GetPattern();
    RegexOptions options = RegexOptions.Compiled | RegexOptions.IgnoreCase;
    reg_word = new Regex(pattern, options);
    return reg_word;
}
/// <summary>
/// Checks whether the input contains any blocked word.
/// </summary>
/// <param name="raw">Text to inspect.</param>
/// <returns><c>true</c> when at least one blocked word is found; otherwise <c>false</c>.</returns>
public static bool HasBlockWords(string raw)
{
    Regex blocked = GetRegex();
    Match firstHit = blocked.Match(raw);
    return firstHit.Success;
}
/// <summary>
/// Replaces every blocked-word occurrence in the input with three asterisks.
/// </summary>
/// <param name="raw">Text to sanitize.</param>
/// <returns>The input with each match of the blocked-word regex replaced by "***".</returns>
public static string WordsFilter(string raw)
{
    const string mask = "***";
    Regex blocked = GetRegex();
    return blocked.Replace(raw, mask);
}
/// <summary>
/// Enumerates the blocked words that occur in the input.
/// </summary>
/// <param name="raw">Text to scan.</param>
/// <returns>
/// A lazily evaluated sequence yielding the matched text of each occurrence
/// reported by the blocked-word regex.
/// </returns>
public static IEnumerable<string> GetBlockWords(string raw)
{
    // Obtain the regex through GetRegex() instead of reading reg_word directly:
    // the field is null until GetRegex() has run once, so touching it here threw
    // NullReferenceException whenever this was the first filter method called.
    foreach (Match hit in GetRegex().Matches(raw))
    {
        yield return hit.Value;
    }
}
/// <summary>
/// Builds the alternation pattern that matches any blocked word returned by
/// GetBlockWords().
/// </summary>
/// <remarks>
/// Each word becomes one capturing group. Single-character words and words made
/// only of digits, '-', '.' and whitespace are matched literally. For every other
/// word a small "gap" sub-pattern is inserted at each \B position so that up to
/// three filler characters between the word's characters do not defeat the match.
/// All literal text is passed through Regex.Escape so that regex metacharacters in
/// a block word are matched as-is instead of corrupting the pattern.
/// </remarks>
/// <returns>
/// The combined pattern, or <c>(?!)</c> (a pattern that never matches) when there
/// are no usable block words — an empty pattern would match every input.
/// </returns>
private static string GetPattern()
{
    // Gap allowed between characters of a word that contains ASCII letters.
    const string latinGap = @"(?:[^a-zA-Z]{0,3})";
    // Gap allowed between characters of any other word (anything outside \u4e00-\u9fa5).
    const string cjkGap = @"(?:[^\u4e00-\u9fa5]{0,3})";

    StringBuilder patt = new StringBuilder();
    foreach (string word in GetBlockWords())
    {
        if (string.IsNullOrEmpty(word))
        {
            continue;
        }

        if (patt.Length > 0)
        {
            patt.Append('|');
        }
        patt.Append('(');

        if (word.Length == 1 || reg_num.IsMatch(word))
        {
            // Short or numeric words are matched exactly, with no gaps.
            patt.Append(Regex.Escape(word));
        }
        else
        {
            string gap = reg_en.IsMatch(word) ? latinGap : cjkGap;

            // Walk the \B positions, emitting the escaped text before each one
            // followed by the gap; this mirrors reg_b.Replace(word, gap) while
            // keeping the literal pieces escaped.
            int last = 0;
            foreach (Match boundary in reg_b.Matches(word))
            {
                patt.Append(Regex.Escape(word.Substring(last, boundary.Index - last)));
                patt.Append(gap);
                last = boundary.Index;
            }
            patt.Append(Regex.Escape(word.Substring(last)));
        }

        patt.Append(')');
    }

    // Empty negative lookahead: always fails, so an empty word list blocks nothing.
    return patt.Length > 0 ? patt.ToString() : "(?!)";
}
/// <summary>
/// Returns the full list of blocked words.
/// </summary>
/// <returns>A newly allocated array containing the blocked words.</returns>
public static string[] GetBlockWords()
{
    // Hard-coded placeholder; per the original author this should be loaded from the database.
    string[] words = new string[3];
    words[0] = "国民党";
    words[1] = "fuck";
    words[2] = "110";
    return words;
}
// Matches a run of one or more ASCII letters anywhere in the input (not anchored).
private static readonly Regex reg_en = new Regex(@"[a-zA-Z]+", RegexOptions.Compiled);
// Matches input that consists solely of '-', '.', whitespace and digits.
private static readonly Regex reg_num = new Regex(@"^[\-\.\s\d]+$", RegexOptions.Compiled);
// Combined regex covering all blocked words; stays null until GetRegex() builds it.
private static Regex reg_word = null; // combined regex of all blocked words
/// <summary>
/// Returns the combined blocked-word regex, creating and caching it in
/// <c>reg_word</c> on the first call.
/// </summary>
/// <returns>The cached, compiled, case-insensitive regex built from GetPattern().</returns>
private static Regex GetRegex()
{
    // Fast path: already built by an earlier call.
    if (reg_word != null)
    {
        return reg_word;
    }

    string pattern = GetPattern();
    RegexOptions options = RegexOptions.Compiled | RegexOptions.IgnoreCase;
    reg_word = new Regex(pattern, options);
    return reg_word;
}
/// <summary>
/// Checks whether the input contains any blocked word.
/// </summary>
/// <param name="raw">Text to inspect.</param>
/// <returns><c>true</c> when at least one blocked word is found; otherwise <c>false</c>.</returns>
public static bool HasBlockWords(string raw)
{
    Regex blocked = GetRegex();
    Match firstHit = blocked.Match(raw);
    return firstHit.Success;
}
/// <summary>
/// Replaces every blocked-word occurrence in the input with three asterisks.
/// </summary>
/// <param name="raw">Text to sanitize.</param>
/// <returns>The input with each match of the blocked-word regex replaced by "***".</returns>
public static string WordsFilter(string raw)
{
    const string mask = "***";
    Regex blocked = GetRegex();
    return blocked.Replace(raw, mask);
}
/// <summary>
/// Enumerates the blocked words that occur in the input.
/// </summary>
/// <param name="raw">Text to scan.</param>
/// <returns>
/// A lazily evaluated sequence yielding the matched text of each occurrence
/// reported by the blocked-word regex.
/// </returns>
public static IEnumerable<string> GetBlockWords(string raw)
{
    // Obtain the regex through GetRegex() instead of reading reg_word directly:
    // the field is null until GetRegex() has run once, so touching it here threw
    // NullReferenceException whenever this was the first filter method called.
    foreach (Match hit in GetRegex().Matches(raw))
    {
        yield return hit.Value;
    }
}
/// <summary>
/// Builds the alternation pattern that matches any blocked word returned by
/// GetBlockWords().
/// </summary>
/// <remarks>
/// Each word becomes one capturing group. Single-character words and words made
/// only of digits, '-', '.' and whitespace are matched literally. For every other
/// word a small "gap" sub-pattern is inserted at each \B position so that up to
/// three filler characters between the word's characters do not defeat the match.
/// All literal text is passed through Regex.Escape so that regex metacharacters in
/// a block word are matched as-is instead of corrupting the pattern.
/// </remarks>
/// <returns>
/// The combined pattern, or <c>(?!)</c> (a pattern that never matches) when there
/// are no usable block words — an empty pattern would match every input.
/// </returns>
private static string GetPattern()
{
    // Gap allowed between characters of a word that contains ASCII letters.
    const string latinGap = @"(?:[^a-zA-Z]{0,3})";
    // Gap allowed between characters of any other word (anything outside \u4e00-\u9fa5).
    const string cjkGap = @"(?:[^\u4e00-\u9fa5]{0,3})";

    StringBuilder patt = new StringBuilder();
    foreach (string word in GetBlockWords())
    {
        if (string.IsNullOrEmpty(word))
        {
            continue;
        }

        if (patt.Length > 0)
        {
            patt.Append('|');
        }
        patt.Append('(');

        if (word.Length == 1 || reg_num.IsMatch(word))
        {
            // Short or numeric words are matched exactly, with no gaps.
            patt.Append(Regex.Escape(word));
        }
        else
        {
            string gap = reg_en.IsMatch(word) ? latinGap : cjkGap;

            // Walk the \B positions, emitting the escaped text before each one
            // followed by the gap; this mirrors reg_b.Replace(word, gap) while
            // keeping the literal pieces escaped.
            int last = 0;
            foreach (Match boundary in reg_b.Matches(word))
            {
                patt.Append(Regex.Escape(word.Substring(last, boundary.Index - last)));
                patt.Append(gap);
                last = boundary.Index;
            }
            patt.Append(Regex.Escape(word.Substring(last)));
        }

        patt.Append(')');
    }

    // Empty negative lookahead: always fails, so an empty word list blocks nothing.
    return patt.Length > 0 ? patt.ToString() : "(?!)";
}
/// <summary>
/// Returns the full list of blocked words.
/// </summary>
/// <returns>A newly allocated array containing the blocked words.</returns>
public static string[] GetBlockWords()
{
    // Hard-coded placeholder; per the original author this should be loaded from the database.
    string[] words = new string[3];
    words[0] = "国民党";
    words[1] = "fuck";
    words[2] = "110";
    return words;
}
作者:Bober Song
出处:http://bober.cnblogs.com/
CARE健康网: http://www.aicareyou.com/
本文版权归作者和博客园共有,欢迎转载,但未经作者同意必须保留此段声明,且在文章页面明显位置给出原文连接,否则保留追究法律责任的权利。
出处:http://bober.cnblogs.com/
CARE健康网: http://www.aicareyou.com/
本文版权归作者和博客园共有,欢迎转载,但未经作者同意必须保留此段声明,且在文章页面明显位置给出原文连接,否则保留追究法律责任的权利。