/// <summary> /// {@inheritDoc} /// </summary> public override bool IncrementToken() { while (input.IncrementToken()) { char[] term = termAttribute.Buffer(); int length = termAttribute.Length; int posIncrement = posIncAttribute.PositionIncrement; if (posIncrement > 0) { previous.Clear(); } bool duplicate = (posIncrement == 0 && previous.Contains(term, 0, length)); // clone the term, and add to the set of seen terms. char[] saved = new char[length]; Array.Copy(term, 0, saved, 0, length); previous.Add(saved); if (!duplicate) { return(true); } } return(false); }
public virtual void TestClear() { var set = new CharArraySet(TEST_VERSION_CURRENT, 10, true); set.AddAll(TEST_STOP_WORDS); assertEquals("Not all words added", TEST_STOP_WORDS.Length, set.size()); set.Clear(); assertEquals("not empty", 0, set.size()); for (var i = 0; i < TEST_STOP_WORDS.Length; i++) { assertFalse(set.Contains(TEST_STOP_WORDS[i])); } set.AddAll(TEST_STOP_WORDS); assertEquals("Not all words added", TEST_STOP_WORDS.Length, set.size()); for (var i = 0; i < TEST_STOP_WORDS.Length; i++) { assertTrue("Set doesn't contain " + TEST_STOP_WORDS[i], set.Contains(TEST_STOP_WORDS[i])); } }
public virtual void TestUnionWithObject() { var originalValues = new string[] { "sally", "sells", "seashells", "by", "the", "sea", "shore" }; CharArraySet target = new CharArraySet(TEST_VERSION_CURRENT, originalValues, false); var existingValuesAsObject = new List<object> { "seashells", "sea", "shore" }; var mixedExistingNonExistingValuesAsObject = new List<object> { "true", "set", "of", "unique", "values", "except", "sells" }; var nonExistingMixedTypes = new object[] { true, (byte)55, (short)44, (int)33, (sbyte)22, (long)11, (char)'\n', "hurray", (uint)99, (ulong)89, (ushort)79, new char[] { 't', 'w', 'o' }, new StringCharSequenceWrapper("testing") }; // Add existing values assertFalse(target.UnionWith(existingValuesAsObject)); assertEquals(7, target.Count); CollectionAssert.AreEquivalent(originalValues, target); // Add mixed existing/non-existing values assertTrue(target.UnionWith(mixedExistingNonExistingValuesAsObject)); assertEquals(13, target.Count); CollectionAssert.AreEquivalent(new string[] { "sally", "sells", "seashells", "by", "the", "sea", "shore", "true", "set", "of", "unique", "values", "except"}, target); target.Clear(); assertEquals(0, target.Count); assertTrue(target.UnionWith(originalValues.Cast<object>())); // Need to cast here because the .NET return type is void for UnionWith. CollectionAssert.AreEquivalent(originalValues, target); // Add mixed types as object assertTrue(target.UnionWith(nonExistingMixedTypes)); assertEquals(20, target.Count); assertTrue(target.Contains(true)); assertTrue(target.Contains((byte)55)); assertTrue(target.Contains((short)44)); assertTrue(target.Contains((int)33)); assertTrue(target.Contains((sbyte)22)); assertTrue(target.Contains((long)11)); assertTrue(target.Contains((char)'\n')); assertTrue(target.Contains("hurray")); assertTrue(target.Contains((uint)99)); assertTrue(target.Contains((ulong)89)); assertTrue(target.Contains((ushort)79)); assertTrue(target.Contains(new char[] { 't', 'w', 'o' })); assertTrue(target.Contains(new StringCharSequenceWrapper("testing"))); }