/// <summary> /// Create a copy of this iterator </summary> /// <returns> A copy of this </returns> public virtual Object Clone() { CharArrayIterator c = new CharArrayIterator(Chars, Begin); c.Pos = this.Pos; return(c); }
public virtual void TestConsumeSentenceInstance() { // we use the default locale, as its randomized by LuceneTestCase var bi = BreakIterator.CreateSentenceInstance(Locale.GetUS()); var ci = CharArrayIterator.NewSentenceInstance(); for (var i = 0; i < 10000; i++) { var text = TestUtil.RandomUnicodeString(Random()).toCharArray(); ci.SetText(text, 0, text.Length); Consume(bi, ci); } }
private string CharacterIteratorToString() { string fullText; if (text is CharArrayIterator) { CharArrayIterator charArrayIterator = (CharArrayIterator)text; fullText = new string(charArrayIterator.Text, charArrayIterator.Start, charArrayIterator.Length); } else { // TODO: is there a better way to extract full text from arbitrary CharacterIterators? StringBuilder builder = new StringBuilder(); for (char ch = text.First(); ch != CharacterIterator.Done; ch = text.Next()) { builder.Append(ch); } fullText = builder.ToString(); text.SetIndex(text.BeginIndex); } return(fullText); }
public virtual void TestSentenceInstance() { DoTests(CharArrayIterator.NewSentenceInstance()); }
public virtual void TestWordInstance() { DoTests(CharArrayIterator.NewWordInstance()); }
/* run this to test if your JRE is buggy * public void testSentenceInstanceJREBUG() { * // we use the default locale, as its randomized by LuceneTestCase * BreakIterator bi = BreakIterator.getSentenceInstance(Locale.getDefault()); * Segment ci = new Segment(); * for (int i = 0; i < 10000; i++) { * char text[] = TestUtil.randomUnicodeString(random).toCharArray(); * ci.array = text; * ci.offset = 0; * ci.count = text.length; * consume(bi, ci); * } * } */ private void DoTests(CharArrayIterator ci) { // basics ci.SetText("testing".ToCharArray(), 0, "testing".Length); assertEquals(0, ci.BeginIndex); assertEquals(7, ci.EndIndex); assertEquals(0, ci.Index); assertEquals('t', ci.Current()); assertEquals('e', ci.Next()); assertEquals('g', ci.Last()); assertEquals('n', ci.Previous()); assertEquals('t', ci.First()); assertEquals(CharacterIterator.DONE, ci.Previous()); // first() ci.SetText("testing".ToCharArray(), 0, "testing".Length); ci.Next(); // Sets the position to getBeginIndex() and returns the character at that position. assertEquals('t', ci.First()); assertEquals(ci.BeginIndex, ci.Index); // or DONE if the text is empty ci.SetText(new char[] { }, 0, 0); assertEquals(CharacterIterator.DONE, ci.First()); // last() ci.SetText("testing".ToCharArray(), 0, "testing".Length); // Sets the position to getEndIndex()-1 (getEndIndex() if the text is empty) // and returns the character at that position. assertEquals('g', ci.Last()); assertEquals(ci.Index, ci.EndIndex - 1); // or DONE if the text is empty ci.SetText(new char[] { }, 0, 0); assertEquals(CharacterIterator.DONE, ci.Last()); assertEquals(ci.EndIndex, ci.Index); // current() // Gets the character at the current position (as returned by getIndex()). ci.SetText("testing".ToCharArray(), 0, "testing".Length); assertEquals('t', ci.Current()); ci.Last(); ci.Next(); // or DONE if the current position is off the end of the text. assertEquals(CharacterIterator.DONE, ci.Current()); // next() ci.SetText("te".ToCharArray(), 0, 2); // Increments the iterator's index by one and returns the character at the new index. assertEquals('e', ci.Next()); assertEquals(1, ci.Index); // or DONE if the new position is off the end of the text range. assertEquals(CharacterIterator.DONE, ci.Next()); assertEquals(ci.EndIndex, ci.Index); // setIndex() ci.SetText("test".ToCharArray(), 0, "test".Length); try { ci.SetIndex(5); fail(); } catch (Exception e) { assertTrue(e is System.ArgumentException); } // clone() var text = "testing".ToCharArray(); ci.SetText(text, 0, text.Length); ci.Next(); var ci2 = ci.Clone() as CharArrayIterator; assertEquals(ci.Index, ci2.Index); assertEquals(ci.Next(), ci2.Next()); assertEquals(ci.Last(), ci2.Last()); }