示例#1
0
        /// <summary>
        /// Builds the analysis chain for a field: a <c>JiebaTokenizer</c> reading from
        /// <paramref name="reader"/>, wrapped in a <c>LowerCaseFilter</c> and then in a
        /// <c>StopFilter</c> constructed with <c>StopWords</c>.
        /// </summary>
        /// <param name="fieldName">Name of the field being analyzed; not used by this implementation.</param>
        /// <param name="reader">Reader supplying the text to tokenize.</param>
        /// <returns>The outermost stage of the chain (the <c>StopFilter</c>).</returns>
        public override TokenStream TokenStream(string fieldName, System.IO.TextReader reader)
        {
            // A fresh segmenter is created for every call and handed to the tokenizer.
            var segmenter = new JiebaSegmenter();

            // Each stage wraps the previous one; the declared type stays TokenStream
            // so the filters receive exactly the same static type as before.
            TokenStream tokenized = new JiebaTokenizer(segmenter, reader);
            TokenStream lowerCased = new LowerCaseFilter(tokenized);

            return new StopFilter(true, lowerCased, StopWords);
        }
示例#2
0
        /// <summary>
        /// Creates the token stream used for a field.
        /// </summary>
        /// <remarks>
        /// The text from <paramref name="reader"/> goes through a <c>JiebaTokenizer</c>
        /// (backed by a newly created <c>JiebaSegmenter</c>), then a <c>LowerCaseFilter</c>,
        /// and finally a <c>StopFilter</c> constructed with <c>StopWords</c>.
        /// </remarks>
        /// <param name="fieldName">Field name; ignored here.</param>
        /// <param name="reader">Reader over the text to analyze.</param>
        /// <returns>The fully wrapped token stream.</returns>
        public override TokenStream TokenStream(string fieldName, System.IO.TextReader reader)
        {
            TokenStream stream = new JiebaTokenizer(new JiebaSegmenter(), reader);
            stream = new LowerCaseFilter(stream);

            return new StopFilter(true, stream, StopWords);
        }
示例#3
0
        /// <summary>
        /// Tokenizes <paramref name="keywords"/> with <paramref name="tokenizer"/> and
        /// returns the resulting words joined by single spaces.
        /// </summary>
        /// <param name="keywords">Raw keyword text passed to <c>tokenizer.Tokenize</c>.</param>
        /// <param name="tokenizer">Tokenizer used to split the keyword text.</param>
        /// <returns>
        /// The non-blank words separated by spaces, with leading and trailing
        /// whitespace trimmed; an empty string when no word qualifies.
        /// </returns>
        private static string GetKeyWordsSplitBySpace(string keywords, JiebaTokenizer tokenizer)
        {
            var buffer = new StringBuilder();

            foreach (var token in tokenizer.Tokenize(keywords))
            {
                var text = token.Word;

                // Null, empty, or whitespace-only words contribute nothing.
                if (!string.IsNullOrWhiteSpace(text))
                {
                    buffer.Append(text).Append(' ');
                }
            }

            // Trim drops the separator left after the last word.
            return buffer.ToString().Trim();
        }
示例#4
0
 /// <summary>
 /// Splits <paramref name="keywords"/> into words via <paramref name="tokenizer"/>
 /// and re-joins the non-blank words with a single space between them.
 /// </summary>
 /// <param name="keywords">Keyword text to tokenize.</param>
 /// <param name="tokenizer">Tokenizer whose <c>Tokenize</c> method produces the words.</param>
 /// <returns>The space-separated words, trimmed of leading and trailing whitespace.</returns>
 private static string GetKeyWordsSplitBySpace(string keywords, JiebaTokenizer tokenizer)
 {
     var joined = new StringBuilder();

     foreach (var token in tokenizer.Tokenize(keywords))
     {
         // Only words with visible content are emitted; each is followed by a space.
         if (!string.IsNullOrWhiteSpace(token.Word))
         {
             joined.AppendFormat("{0} ", token.Word);
         }
     }

     // The final Trim removes the trailing separator.
     var text = joined.ToString();
     return text.Trim();
 }