blob: 0287a7ce53e70dcba4d877521610adf710a2ef3e [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.lucene.analysis.util;
import java.text.BreakIterator;
import java.text.CharacterIterator;
import java.util.Locale;
import org.apache.lucene.util.LuceneTestCase;
import org.apache.lucene.util.TestUtil;
public class TestCharArrayIterator extends LuceneTestCase {
public void testWordInstance() {
doTests(CharArrayIterator.newWordInstance());
}
public void testConsumeWordInstance() {
// we use the default locale, as it's randomized by LuceneTestCase
BreakIterator bi = BreakIterator.getWordInstance(Locale.getDefault());
CharArrayIterator ci = CharArrayIterator.newWordInstance();
for (int i = 0; i < 10000; i++) {
char text[] = TestUtil.randomUnicodeString(random()).toCharArray();
ci.setText(text, 0, text.length);
consume(bi, ci);
}
}
/* run this to test if your JRE is buggy
public void testWordInstanceJREBUG() {
// we use the default locale, as it's randomized by LuceneTestCase
BreakIterator bi = BreakIterator.getWordInstance(Locale.getDefault());
Segment ci = new Segment();
for (int i = 0; i < 10000; i++) {
char text[] = _TestUtil.randomUnicodeString(random).toCharArray();
ci.array = text;
ci.offset = 0;
ci.count = text.length;
consume(bi, ci);
}
}
*/
public void testSentenceInstance() {
doTests(CharArrayIterator.newSentenceInstance());
}
public void testConsumeSentenceInstance() {
// we use the default locale, as it's randomized by LuceneTestCase
BreakIterator bi = BreakIterator.getSentenceInstance(Locale.getDefault());
CharArrayIterator ci = CharArrayIterator.newSentenceInstance();
for (int i = 0; i < 10000; i++) {
char text[] = TestUtil.randomUnicodeString(random()).toCharArray();
ci.setText(text, 0, text.length);
consume(bi, ci);
}
}
/* run this to test if your JRE is buggy
public void testSentenceInstanceJREBUG() {
// we use the default locale, as it's randomized by LuceneTestCase
BreakIterator bi = BreakIterator.getSentenceInstance(Locale.getDefault());
Segment ci = new Segment();
for (int i = 0; i < 10000; i++) {
char text[] = _TestUtil.randomUnicodeString(random).toCharArray();
ci.array = text;
ci.offset = 0;
ci.count = text.length;
consume(bi, ci);
}
}
*/
private void doTests(CharArrayIterator ci) {
// basics
ci.setText("testing".toCharArray(), 0, "testing".length());
assertEquals(0, ci.getBeginIndex());
assertEquals(7, ci.getEndIndex());
assertEquals(0, ci.getIndex());
assertEquals('t', ci.current());
assertEquals('e', ci.next());
assertEquals('g', ci.last());
assertEquals('n', ci.previous());
assertEquals('t', ci.first());
assertEquals(CharacterIterator.DONE, ci.previous());
// first()
ci.setText("testing".toCharArray(), 0, "testing".length());
ci.next();
// Sets the position to getBeginIndex() and returns the character at that position.
assertEquals('t', ci.first());
assertEquals(ci.getBeginIndex(), ci.getIndex());
// or DONE if the text is empty
ci.setText(new char[] {}, 0, 0);
assertEquals(CharacterIterator.DONE, ci.first());
// last()
ci.setText("testing".toCharArray(), 0, "testing".length());
// Sets the position to getEndIndex()-1 (getEndIndex() if the text is empty)
// and returns the character at that position.
assertEquals('g', ci.last());
assertEquals(ci.getIndex(), ci.getEndIndex() - 1);
// or DONE if the text is empty
ci.setText(new char[] {}, 0, 0);
assertEquals(CharacterIterator.DONE, ci.last());
assertEquals(ci.getEndIndex(), ci.getIndex());
// current()
// Gets the character at the current position (as returned by getIndex()).
ci.setText("testing".toCharArray(), 0, "testing".length());
assertEquals('t', ci.current());
ci.last();
ci.next();
// or DONE if the current position is off the end of the text.
assertEquals(CharacterIterator.DONE, ci.current());
// next()
ci.setText("te".toCharArray(), 0, 2);
// Increments the iterator's index by one and returns the character at the new index.
assertEquals('e', ci.next());
assertEquals(1, ci.getIndex());
// or DONE if the new position is off the end of the text range.
assertEquals(CharacterIterator.DONE, ci.next());
assertEquals(ci.getEndIndex(), ci.getIndex());
// setIndex()
ci.setText("test".toCharArray(), 0, "test".length());
expectThrows(IllegalArgumentException.class, () -> {
ci.setIndex(5);
});
// clone()
char text[] = "testing".toCharArray();
ci.setText(text, 0, text.length);
ci.next();
CharArrayIterator ci2 = ci.clone();
assertEquals(ci.getIndex(), ci2.getIndex());
assertEquals(ci.next(), ci2.next());
assertEquals(ci.last(), ci2.last());
}
private void consume(BreakIterator bi, CharacterIterator ci) {
bi.setText(ci);
while (bi.next() != BreakIterator.DONE)
;
}
}