A stemmer for German words.

The algorithm is based on the report "A Fast and Simple Stemming Algorithm for German Words" by Jörg Caumanns (joerg.caumanns at isst.fhg.de).

Пример #1
0
 /// <summary>
 /// Replaces the stemmer of this filter with an alternative/custom <see cref="GermanStemmer"/>.
 /// </summary>
 /// <param name="stemmer">The stemmer to assign. A <c>null</c> value is ignored and the
 /// currently assigned stemmer is left untouched.</param>
 public void SetStemmer(GermanStemmer stemmer)
 {
     // Nothing to swap in: keep whatever stemmer is already assigned.
     if (stemmer == null)
     {
         return;
     }

     this.stemmer = stemmer;
 }
Пример #2
0
		/// <summary>
		/// Assigns an alternative/custom <see cref="GermanStemmer"/> to this filter.
		/// </summary>
		/// <param name="stemmer">The replacement stemmer. Passing <c>null</c> is a no-op:
		/// the stemmer field keeps its current value.</param>
		public void SetStemmer( GermanStemmer stemmer )
		{
			// A null argument must not overwrite the existing stemmer.
			if ( stemmer == null )
			{
				return;
			}

			this.stemmer = stemmer;
		}
Пример #3
0
 /// <summary>
 /// Builds a GermanStemFilter that uses an exclusion table.
 /// </summary>
 /// <param name="_in">The token stream handed to the base constructor.</param>
 /// <param name="exclusiontable">The set of strings stored as this filter's exclusion set.</param>
 /// <param name="normalizeDin2">Specifies if the DIN-2007-2 style stemmer should be used in addition to DIN1.
 /// This will cause words with 'ae', 'ue', or 'oe' in them (expanded umlauts) to be first converted to
 /// 'a', 'u', and 'o' respectively, before the DIN1 stemmer is invoked.</param>
 public GermanStemFilter(TokenStream _in, ISet<string> exclusiontable, bool normalizeDin2)
     : base(_in)
 {
     this.exclusionSet = exclusiontable;

     // Pick the stemmer implementation according to the requested normalization.
     if (normalizeDin2)
     {
         this.stemmer = new GermanDIN2Stemmer();
     }
     else
     {
         this.stemmer = new GermanStemmer();
     }

     // Keep a reference to the term attribute returned by AddAttribute.
     this.termAtt = AddAttribute<ITermAttribute>();
 }
Пример #4
0
 /// <summary>
 /// Creates a GermanStemFilter configured with an exclusion table.
 /// </summary>
 /// <param name="_in">The token stream passed on to the base constructor.</param>
 /// <param name="exclusiontable">The set of strings assigned to the filter's exclusion set.</param>
 /// <param name="normalizeDin2">Specifies if the DIN-2007-2 style stemmer should be used in addition to DIN1.
 /// This will cause words with 'ae', 'ue', or 'oe' in them (expanded umlauts) to be first converted to
 /// 'a', 'u', and 'o' respectively, before the DIN1 stemmer is invoked.</param>
 public GermanStemFilter(TokenStream _in, ISet<string> exclusiontable, bool normalizeDin2)
     : base(_in)
 {
     exclusionSet = exclusiontable;

     // Without DIN2 normalization the plain GermanStemmer is used;
     // otherwise the GermanDIN2Stemmer takes its place.
     if (!normalizeDin2)
     {
         stemmer = new GermanStemmer();
     }
     else
     {
         stemmer = new GermanDIN2Stemmer();
     }

     // Store the term attribute obtained from AddAttribute.
     termAtt = AddAttribute<ITermAttribute>();
 }
Пример #5
0
 /// <summary>
 /// Builds a GermanStemFilter over the given token stream and assigns a new
 /// <see cref="GermanStemmer"/> as its stemmer.
 /// </summary>
 /// <param name="_in">The token stream handed to the base constructor.</param>
 public GermanStemFilter(TokenStream _in)
     : base(_in)
 {
     this.stemmer = new GermanStemmer();
 }
Пример #6
0
		/// <summary>
		/// Creates a GermanStemFilter for the given token stream; its stemmer is set to a
		/// newly constructed <see cref="GermanStemmer"/>.
		/// </summary>
		/// <param name="_in">The token stream passed on to the base constructor.</param>
		public GermanStemFilter( TokenStream _in )
			: base( _in )
		{
			this.stemmer = new GermanStemmer();
		}