C# (CSharp) Lucene.Net.Analysis.Miscellaneous CodepointCountFilter示例

编程语言: C# (CSharp)

命名空间/包名称: Lucene.Net.Analysis.Miscellaneous

hotexamples.com的示例: 4

C# (CSharp) Lucene.Net.Analysis.Miscellaneous CodepointCountFilter - 已找到4个示例。这些是从开源项目中提取的、最受好评的 Lucene.Net.Analysis.Miscellaneous.CodepointCountFilter 真实 C# (CSharp) 代码示例。您可以对示例进行评分，以帮助我们提高示例质量。

常用方法

显示/隐藏

Dispose(1)

End(1)

IncrementToken(1)

Reset(1)

Removes words that are too long or too short from the stream.

Note: Length is calculated as the number of Unicode codepoints.

Inheritance: Lucene.Net.Analysis.Util.FilteringTokenFilter

CodepointCountFilter Class Documentation

示例#1

显示文件

        /// <summary>
        /// Runs a whitespace-tokenized sentence through a <see cref="CodepointCountFilter"/>
        /// configured with bounds 2 and 6, and checks that only "short", "ab" and "foo"
        /// come out, together with the expected integer values 1, 4, 2 (judging by the
        /// test name, these are the tokens' position increments).
        /// </summary>
        public virtual void TestFilterWithPosIncr()
        {
            const string input = "short toolong evenmuchlongertext a ab toolong foo";
            string[] expectedTerms = { "short", "ab", "foo" };
            int[] expectedPosIncrs = { 1, 4, 2 };

            TokenStream tokenizer = new MockTokenizer(new StringReader(input), MockTokenizer.WHITESPACE, false);

            AssertTokenStreamContents(
                new CodepointCountFilter(TEST_VERSION_CURRENT, tokenizer, 2, 6),
                expectedTerms,
                expectedPosIncrs);
        }

示例#2

显示文件

文件： TestCodepointCountFilter.cs 项目： simixsistemas/lucenenet

 /// <summary>
 /// Randomized check of <see cref="CodepointCountFilter"/>: for 10000 random Unicode
 /// strings and random bounds, the first call to <c>IncrementToken</c> must return
 /// <c>true</c> exactly when the string's codepoint count lies within the inclusive
 /// range [min, max].
 /// </summary>
 public virtual void TestRandomStrings()
 {
     for (int i = 0; i < 10000; i++)
     {
         // Keep the order of the random draws unchanged so seeded runs stay reproducible.
         string text = TestUtil.RandomUnicodeString(Random, 100);
         int min = TestUtil.NextInt32(Random, 0, 100);
         int max = TestUtil.NextInt32(Random, 0, 100);
         int count = text.CodePointCount(0, text.Length);

         // The two bounds are drawn independently; swap them so that min <= max.
         if (min > max)
         {
             int temp = min;
             min = max;
             max = temp;
         }

         bool expected = count >= min && count <= max;
         TokenStream stream = new KeywordTokenizer(new StringReader(text));
         stream = new CodepointCountFilter(TEST_VERSION_CURRENT, stream, min, max);
         try
         {
             stream.Reset();
             assertEquals(expected, stream.IncrementToken());
             stream.End();
         }
         finally
         {
             // Dispose even when the assertion (or a stream call) throws, so a
             // failing iteration does not leak the stream.
             stream.Dispose();
         }
     }
 }

示例#3

显示文件

文件： TestCodepointCountFilter.cs 项目： ChristopherHaws/lucenenet

 /// <summary>
 /// Randomized check of <see cref="CodepointCountFilter"/>: for 10000 random Unicode
 /// strings and random bounds, the first call to <c>IncrementToken</c> must return
 /// <c>true</c> exactly when the string's codepoint count lies within the inclusive
 /// range [min, max].
 /// </summary>
 public virtual void TestRandomStrings()
 {
     for (int i = 0; i < 10000; i++)
     {
         // Keep the order of the random draws unchanged so seeded runs stay reproducible.
         string text = TestUtil.RandomUnicodeString(Random(), 100);
         int min = TestUtil.NextInt(Random(), 0, 100);
         int max = TestUtil.NextInt(Random(), 0, 100);
         int count = Character.CodePointCount(text, 0, text.Length);

         // The two bounds are drawn independently; swap them so that min <= max.
         if (min > max)
         {
             int temp = min;
             min = max;
             max = temp;
         }

         bool expected = count >= min && count <= max;
         TokenStream stream = new KeywordTokenizer(new StringReader(text));
         stream = new CodepointCountFilter(TEST_VERSION_CURRENT, stream, min, max);
         try
         {
             stream.Reset();
             assertEquals(expected, stream.IncrementToken());
             stream.End();
         }
         finally
         {
             // Dispose even when the assertion (or a stream call) throws, so a
             // failing iteration does not leak the stream.
             stream.Dispose();
         }
     }
 }

示例#4

显示文件

文件： TestCodepointCountFilter.cs 项目： ChristopherHaws/lucenenet

 /// <summary>
 /// Filters a whitespace-tokenized sentence with a <see cref="CodepointCountFilter"/>
 /// using bounds 2 and 6, then asserts that the remaining terms are "short", "ab"
 /// and "foo" with the accompanying integer values 1, 4, 2 (presumably position
 /// increments, as the test name suggests).
 /// </summary>
 public virtual void TestFilterWithPosIncr()
 {
     StringReader reader = new StringReader("short toolong evenmuchlongertext a ab toolong foo");
     TokenStream source = new MockTokenizer(reader, MockTokenizer.WHITESPACE, false);
     CodepointCountFilter lengthFilter = new CodepointCountFilter(TEST_VERSION_CURRENT, source, 2, 6);

     AssertTokenStreamContents(
         lengthFilter,
         new string[] { "short", "ab", "foo" },
         new int[] { 1, 4, 2 });
 }