lucene/analysis/common/src/test/org/apache/lucene/analysis/util/TestCharArrayIterator.java - lucene-solr - Git at Google

 /*
  * Licensed to the Apache Software Foundation (ASF) under one or more
  * contributor license agreements.  See the NOTICE file distributed with
  * this work for additional information regarding copyright ownership.
  * The ASF licenses this file to You under the Apache License, Version 2.0
  * (the "License"); you may not use this file except in compliance with
  * the License.  You may obtain a copy of the License at
  *
  *     http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */
 package org.apache.lucene.analysis.util;


 import java.text.BreakIterator;
 import java.text.CharacterIterator;
 import java.util.Locale;

 import org.apache.lucene.util.LuceneTestCase;
 import org.apache.lucene.util.TestUtil;

 public class TestCharArrayIterator extends LuceneTestCase {

   public void testWordInstance() {
     doTests(CharArrayIterator.newWordInstance());
   }

   public void testConsumeWordInstance() {
     // we use the default locale, as it's randomized by LuceneTestCase
     BreakIterator bi = BreakIterator.getWordInstance(Locale.getDefault());
     CharArrayIterator ci = CharArrayIterator.newWordInstance();
     for (int i = 0; i < 10000; i++) {
       char text[] = TestUtil.randomUnicodeString(random()).toCharArray();
       ci.setText(text, 0, text.length);
       consume(bi, ci);
     }
   }

   /* run this to test if your JRE is buggy
   public void testWordInstanceJREBUG() {
     // we use the default locale, as it's randomized by LuceneTestCase
     BreakIterator bi = BreakIterator.getWordInstance(Locale.getDefault());
     Segment ci = new Segment();
     for (int i = 0; i < 10000; i++) {
       char text[] = _TestUtil.randomUnicodeString(random).toCharArray();
       ci.array = text;
       ci.offset = 0;
       ci.count = text.length;
       consume(bi, ci);
     }
   }
   */

   public void testSentenceInstance() {
     doTests(CharArrayIterator.newSentenceInstance());
   }

   public void testConsumeSentenceInstance() {
     // we use the default locale, as it's randomized by LuceneTestCase
     BreakIterator bi = BreakIterator.getSentenceInstance(Locale.getDefault());
     CharArrayIterator ci = CharArrayIterator.newSentenceInstance();
     for (int i = 0; i < 10000; i++) {
       char text[] = TestUtil.randomUnicodeString(random()).toCharArray();
       ci.setText(text, 0, text.length);
       consume(bi, ci);
     }
   }

   /* run this to test if your JRE is buggy
   public void testSentenceInstanceJREBUG() {
     // we use the default locale, as it's randomized by LuceneTestCase
     BreakIterator bi = BreakIterator.getSentenceInstance(Locale.getDefault());
     Segment ci = new Segment();
     for (int i = 0; i < 10000; i++) {
       char text[] = _TestUtil.randomUnicodeString(random).toCharArray();
       ci.array = text;
       ci.offset = 0;
       ci.count = text.length;
       consume(bi, ci);
     }
   }
   */

   private void doTests(CharArrayIterator ci) {
     // basics
     ci.setText("testing".toCharArray(), 0, "testing".length());
     assertEquals(0, ci.getBeginIndex());
     assertEquals(7, ci.getEndIndex());
     assertEquals(0, ci.getIndex());
     assertEquals('t', ci.current());
     assertEquals('e', ci.next());
     assertEquals('g', ci.last());
     assertEquals('n', ci.previous());
     assertEquals('t', ci.first());
     assertEquals(CharacterIterator.DONE, ci.previous());

     // first()
     ci.setText("testing".toCharArray(), 0, "testing".length());
     ci.next();
     // Sets the position to getBeginIndex() and returns the character at that position.
     assertEquals('t', ci.first());
     assertEquals(ci.getBeginIndex(), ci.getIndex());
     // or DONE if the text is empty
     ci.setText(new char[] {}, 0, 0);
     assertEquals(CharacterIterator.DONE, ci.first());

     // last()
     ci.setText("testing".toCharArray(), 0, "testing".length());
     // Sets the position to getEndIndex()-1 (getEndIndex() if the text is empty)
     // and returns the character at that position.
     assertEquals('g', ci.last());
     assertEquals(ci.getIndex(), ci.getEndIndex() - 1);
     // or DONE if the text is empty
     ci.setText(new char[] {}, 0, 0);
     assertEquals(CharacterIterator.DONE, ci.last());
     assertEquals(ci.getEndIndex(), ci.getIndex());

     // current()
     // Gets the character at the current position (as returned by getIndex()).
     ci.setText("testing".toCharArray(), 0, "testing".length());
     assertEquals('t', ci.current());
     ci.last();
     ci.next();
     // or DONE if the current position is off the end of the text.
     assertEquals(CharacterIterator.DONE, ci.current());

     // next()
     ci.setText("te".toCharArray(), 0, 2);
     // Increments the iterator's index by one and returns the character at the new index.
     assertEquals('e', ci.next());
     assertEquals(1, ci.getIndex());
     // or DONE if the new position is off the end of the text range.
     assertEquals(CharacterIterator.DONE, ci.next());
     assertEquals(ci.getEndIndex(), ci.getIndex());

     // setIndex()
     ci.setText("test".toCharArray(), 0, "test".length());
     expectThrows(IllegalArgumentException.class, () -> {
       ci.setIndex(5);
     });

     // clone()
     char text[] = "testing".toCharArray();
     ci.setText(text, 0, text.length);
     ci.next();
     CharArrayIterator ci2 = ci.clone();
     assertEquals(ci.getIndex(), ci2.getIndex());
     assertEquals(ci.next(), ci2.next());
     assertEquals(ci.last(), ci2.last());
   }

   private void consume(BreakIterator bi, CharacterIterator ci) {
     bi.setText(ci);
     while (bi.next() != BreakIterator.DONE)
       ;
   }
 }
	/*
	* Licensed to the Apache Software Foundation (ASF) under one or more
	* contributor license agreements. See the NOTICE file distributed with
	* this work for additional information regarding copyright ownership.
	* The ASF licenses this file to You under the Apache License, Version 2.0
	* (the "License"); you may not use this file except in compliance with
	* the License. You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*/
	package org.apache.lucene.analysis.util;


	import java.text.BreakIterator;
	import java.text.CharacterIterator;
	import java.util.Locale;

	import org.apache.lucene.util.LuceneTestCase;
	import org.apache.lucene.util.TestUtil;

	public class TestCharArrayIterator extends LuceneTestCase {

	public void testWordInstance() {
	doTests(CharArrayIterator.newWordInstance());
	}

	public void testConsumeWordInstance() {
	// we use the default locale, as it's randomized by LuceneTestCase
	BreakIterator bi = BreakIterator.getWordInstance(Locale.getDefault());
	CharArrayIterator ci = CharArrayIterator.newWordInstance();
	for (int i = 0; i < 10000; i++) {
	char text[] = TestUtil.randomUnicodeString(random()).toCharArray();
	ci.setText(text, 0, text.length);
	consume(bi, ci);
	}
	}

	/* run this to test if your JRE is buggy
	public void testWordInstanceJREBUG() {
	// we use the default locale, as it's randomized by LuceneTestCase
	BreakIterator bi = BreakIterator.getWordInstance(Locale.getDefault());
	Segment ci = new Segment();
	for (int i = 0; i < 10000; i++) {
	char text[] = _TestUtil.randomUnicodeString(random).toCharArray();
	ci.array = text;
	ci.offset = 0;
	ci.count = text.length;
	consume(bi, ci);
	}
	}
	*/

	public void testSentenceInstance() {
	doTests(CharArrayIterator.newSentenceInstance());
	}

	public void testConsumeSentenceInstance() {
	// we use the default locale, as it's randomized by LuceneTestCase
	BreakIterator bi = BreakIterator.getSentenceInstance(Locale.getDefault());
	CharArrayIterator ci = CharArrayIterator.newSentenceInstance();
	for (int i = 0; i < 10000; i++) {
	char text[] = TestUtil.randomUnicodeString(random()).toCharArray();
	ci.setText(text, 0, text.length);
	consume(bi, ci);
	}
	}

	/* run this to test if your JRE is buggy
	public void testSentenceInstanceJREBUG() {
	// we use the default locale, as it's randomized by LuceneTestCase
	BreakIterator bi = BreakIterator.getSentenceInstance(Locale.getDefault());
	Segment ci = new Segment();
	for (int i = 0; i < 10000; i++) {
	char text[] = _TestUtil.randomUnicodeString(random).toCharArray();
	ci.array = text;
	ci.offset = 0;
	ci.count = text.length;
	consume(bi, ci);
	}
	}
	*/

	private void doTests(CharArrayIterator ci) {
	// basics
	ci.setText("testing".toCharArray(), 0, "testing".length());
	assertEquals(0, ci.getBeginIndex());
	assertEquals(7, ci.getEndIndex());
	assertEquals(0, ci.getIndex());
	assertEquals('t', ci.current());
	assertEquals('e', ci.next());
	assertEquals('g', ci.last());
	assertEquals('n', ci.previous());
	assertEquals('t', ci.first());
	assertEquals(CharacterIterator.DONE, ci.previous());

	// first()
	ci.setText("testing".toCharArray(), 0, "testing".length());
	ci.next();
	// Sets the position to getBeginIndex() and returns the character at that position.
	assertEquals('t', ci.first());
	assertEquals(ci.getBeginIndex(), ci.getIndex());
	// or DONE if the text is empty
	ci.setText(new char[] {}, 0, 0);
	assertEquals(CharacterIterator.DONE, ci.first());

	// last()
	ci.setText("testing".toCharArray(), 0, "testing".length());
	// Sets the position to getEndIndex()-1 (getEndIndex() if the text is empty)
	// and returns the character at that position.
	assertEquals('g', ci.last());
	assertEquals(ci.getIndex(), ci.getEndIndex() - 1);
	// or DONE if the text is empty
	ci.setText(new char[] {}, 0, 0);
	assertEquals(CharacterIterator.DONE, ci.last());
	assertEquals(ci.getEndIndex(), ci.getIndex());

	// current()
	// Gets the character at the current position (as returned by getIndex()).
	ci.setText("testing".toCharArray(), 0, "testing".length());
	assertEquals('t', ci.current());
	ci.last();
	ci.next();
	// or DONE if the current position is off the end of the text.
	assertEquals(CharacterIterator.DONE, ci.current());

	// next()
	ci.setText("te".toCharArray(), 0, 2);
	// Increments the iterator's index by one and returns the character at the new index.
	assertEquals('e', ci.next());
	assertEquals(1, ci.getIndex());
	// or DONE if the new position is off the end of the text range.
	assertEquals(CharacterIterator.DONE, ci.next());
	assertEquals(ci.getEndIndex(), ci.getIndex());

	// setIndex()
	ci.setText("test".toCharArray(), 0, "test".length());
	expectThrows(IllegalArgumentException.class, () -> {
	ci.setIndex(5);
	});

	// clone()
	char text[] = "testing".toCharArray();
	ci.setText(text, 0, text.length);
	ci.next();
	CharArrayIterator ci2 = ci.clone();
	assertEquals(ci.getIndex(), ci2.getIndex());
	assertEquals(ci.next(), ci2.next());
	assertEquals(ci.last(), ci2.last());
	}

	private void consume(BreakIterator bi, CharacterIterator ci) {
	bi.setText(ci);
	while (bi.next() != BreakIterator.DONE)
	;
	}
	}