/// <summary> /// 查找并替换 ///使用方法 /// string returnstr = "";//返回已经替换的敏感词 ///string str = System.AppDomain.CurrentDomain.SetupInformation.ApplicationBase; ///fw.DictionaryPath = str + "sensitive.txt"; ///fw.SourctText = txttest.Value.Trim(); /// returnstr = fw.Filter('*');//*为要替换成的字符 /// </summary> /// <param name="replaceChar">替换成的字符</param> public string Filter(char replaceChar) { LoadDictionary(); if (_sourctText != string.Empty) { char[] tempString = _sourctText.ToCharArray();; for (int i = 0; i < SourctText.Length; i++) { //查询以该字为首字符的词组 WordGroup group = _memorylexicon[(int)ToDbc(SourctText)[i]]; if (group != null) { for (int z = 0; z < group.Count(); z++) { string word = group.GetWord(z); if (word.Length == 0 || Check(word)) { string blackword = string.Empty; for (int pos = 0; pos < _wordlenght + 1; pos++) { blackword += tempString[pos + _cursor].ToString(); tempString[pos + _cursor] = replaceChar; } _illegalWords.Add(blackword); _cursor = _cursor + _wordlenght; i = i + _wordlenght; } } } _cursor++; } return(new string(tempString)); } else { return(string.Empty); } }
/// <summary> /// 加载内存词库 /// </summary> private void LoadDictionary() { if (DictionaryPath != string.Empty) { List <string> wordList = new List <string>(); Array.Clear(_memorylexicon, 0, _memorylexicon.Length); string[] words = System.IO.File.ReadAllLines(DictionaryPath, System.Text.Encoding.UTF8); foreach (string word in words) { string key = this.ToDbc(word); wordList.Add(key); wordList.Add(Microsoft.VisualBasic.Strings.StrConv(key, Microsoft.VisualBasic.VbStrConv.TraditionalChinese, 0)); } Comparison <string> cmp = delegate(string key1, string key2) { return(key1.CompareTo(key2)); }; wordList.Sort(cmp); for (int i = wordList.Count - 1; i > 0; i--) { if (wordList[i].ToString() == wordList[i - 1].ToString()) { wordList.RemoveAt(i); } } foreach (var word in wordList) { WordGroup group = _memorylexicon[(int)word[0]]; if (group == null) { group = new WordGroup(); _memorylexicon[(int)word[0]] = group; } group.Add(word.Substring(1)); } } }