Пример #1
0
        /// <summary>
        /// Builds the Russian analysis chain over the text supplied by <paramref name="reader"/>.
        /// </summary>
        /// <param name="fieldName">Name of the field being analyzed; not consulted by this implementation.</param>
        /// <param name="reader">Source of the text to tokenize.</param>
        /// <returns>
        /// A RussianLetterTokenizer wrapped, in order, by RussianLowerCaseFilter,
        /// StopFilter (constructed with stopSet) and RussianStemFilter.
        /// </returns>
        public override TokenStream TokenStream(System.String fieldName, System.IO.TextReader reader)
        {
            // Each stage is declared as TokenStream so every filter constructor
            // receives the base type.
            TokenStream letters = new RussianLetterTokenizer(reader, charset);
            TokenStream lowerCased = new RussianLowerCaseFilter(letters, charset);
            TokenStream stopFiltered = new StopFilter(lowerCased, stopSet);
            TokenStream stemmed = new RussianStemFilter(stopFiltered, charset);

            return stemmed;
        }
Пример #2
0
        /// <summary>
        /// Builds the German analysis chain over the text supplied by <paramref name="reader"/>.
        /// </summary>
        /// <param name="fieldName">Name of the field being analyzed; not consulted by this implementation.</param>
        /// <param name="reader">Source of the text to tokenize.</param>
        /// <returns>
        /// A StandardTokenizer wrapped, in order, by StandardFilter, LowerCaseFilter,
        /// StopFilter (constructed with stopSet) and GermanStemFilter (constructed with exclusionSet).
        /// </returns>
        public override TokenStream TokenStream(System.String fieldName, System.IO.TextReader reader)
        {
            // Each stage is declared as TokenStream so every filter constructor
            // receives the base type.
            TokenStream tokenized = new StandardTokenizer(reader);
            TokenStream normalized = new StandardFilter(tokenized);
            TokenStream lowerCased = new LowerCaseFilter(normalized);
            TokenStream stopFiltered = new StopFilter(lowerCased, stopSet);
            TokenStream stemmed = new GermanStemFilter(stopFiltered, exclusionSet);

            return stemmed;
        }
		/// <summary>
		/// Creates the token stream used to analyze German text read from <paramref name="reader"/>.
		/// </summary>
		/// <param name="fieldName">Field name supplied by the caller; this method does not read it.</param>
		/// <param name="reader">Reader providing the text to be tokenized.</param>
		/// <returns>
		/// A TokenStream built from a StandardTokenizer filtered with StandardFilter,
		/// LowerCaseFilter, StopFilter (given stopSet) and GermanStemFilter (given exclusionSet).
		/// </returns>
		public override TokenStream TokenStream(System.String fieldName, System.IO.TextReader reader)
		{
			// Stages are typed as TokenStream, the same static type the filters were
			// given before this chain was split into named steps.
			TokenStream source = new StandardTokenizer(reader);
			TokenStream standardized = new StandardFilter(source);
			TokenStream lowered = new LowerCaseFilter(standardized);
			TokenStream withoutStopWords = new StopFilter(lowered, stopSet);

			// The stemmer is the outermost stage and is handed back to the caller.
			return new GermanStemFilter(withoutStopWords, exclusionSet);
		}
		/// <summary>
		/// Creates the token stream used to analyze Russian text read from <paramref name="reader"/>.
		/// </summary>
		/// <param name="fieldName">Field name supplied by the caller; this method does not read it.</param>
		/// <param name="reader">Reader providing the text to be tokenized.</param>
		/// <returns>
		/// A TokenStream built from a RussianLetterTokenizer filtered with
		/// RussianLowerCaseFilter, StopFilter (given stopSet) and RussianStemFilter.
		/// </returns>
		public override TokenStream TokenStream(System.String fieldName, System.IO.TextReader reader)
		{
			// Stages are typed as TokenStream, the same static type the filters were
			// given before this chain was split into named steps.
			TokenStream source = new RussianLetterTokenizer(reader, charset);
			TokenStream lowered = new RussianLowerCaseFilter(source, charset);
			TokenStream withoutStopWords = new StopFilter(lowered, stopSet);

			// The stemmer is the outermost stage and is handed back to the caller.
			return new RussianStemFilter(withoutStopWords, charset);
		}
Пример #5
0
 /// <summary>
 /// Replaces the exclusion set with one produced by StopFilter.MakeStopSet
 /// from the given array of strings.
 /// </summary>
 /// <param name="exclusionlist">Strings to place in the exclusion set.</param>
 public virtual void SetStemExclusionTable(System.String[] exclusionlist)
 {
     this.exclusionSet = StopFilter.MakeStopSet(exclusionlist);
 }
Пример #6
0
 /// <summary>
 /// Builds an analyzer whose stop set is produced by StopFilter.MakeStopSet
 /// from the supplied stop words.
 /// </summary>
 /// <param name="stopwords">Stop words to build the stop set from.</param>
 public GermanAnalyzer(System.String[] stopwords)
 {
     this.stopSet = StopFilter.MakeStopSet(stopwords);
 }
Пример #7
0
 /// <summary>
 /// Builds an analyzer whose stop set is produced by StopFilter.MakeStopSet
 /// from GERMAN_STOP_WORDS.
 /// </summary>
 public GermanAnalyzer()
 {
     this.stopSet = StopFilter.MakeStopSet(GERMAN_STOP_WORDS);
 }
Пример #8
0
 /// <summary>
 /// Builds an analyzer that stores the given charset and takes its stop set
 /// from StopFilter.MakeStopSet applied to the supplied stop words.
 /// </summary>
 /// <param name="charset">Charset stored on the analyzer.</param>
 /// <param name="stopwords">Stop words to build the stop set from.</param>
 public RussianAnalyzer(char[] charset, System.String[] stopwords)
 {
     this.charset = charset;
     this.stopSet = StopFilter.MakeStopSet(stopwords);
 }
Пример #9
0
 /// <summary>
 /// Builds an analyzer that stores the given charset and takes its stop set
 /// from StopFilter.MakeStopSet applied to the result of makeStopWords for that charset.
 /// </summary>
 /// <param name="charset">Charset stored on the analyzer and passed to makeStopWords.</param>
 public RussianAnalyzer(char[] charset)
 {
     this.charset = charset;
     // The parameter (not the field) is passed on, as both hold the same reference here.
     this.stopSet = StopFilter.MakeStopSet(makeStopWords(charset));
 }
Пример #10
0
 /// <summary>
 /// Builds an analyzer that uses RussianCharsets.UnicodeRussian as its charset and
 /// takes its stop set from StopFilter.MakeStopSet applied to the result of
 /// makeStopWords for that same charset.
 /// </summary>
 public RussianAnalyzer()
 {
     this.charset = RussianCharsets.UnicodeRussian;
     this.stopSet = StopFilter.MakeStopSet(makeStopWords(RussianCharsets.UnicodeRussian));
 }