blob: c4f4c3443598c511fe72c35c284f6b45a7e9e42e [file] [log] [blame]
using J2N.Text;
//using Lucene.Net.Support;
using NUnit.Framework;
using System.Collections.Generic;
using System.Text;
using System.Text.RegularExpressions;
namespace Lucene.Net.Analysis.TokenAttributes
/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements. See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
using BytesRef = Lucene.Net.Util.BytesRef;
using LuceneTestCase = Lucene.Net.Util.LuceneTestCase;
using TestUtil = Lucene.Net.Util.TestUtil;
public class TestCharTermAttributeImpl : LuceneTestCase
// Copies "hello" into a fresh CharTermAttribute, then for i in [0, 2000) asserts that
// the backing buffer is at least i chars long and that the term text is still "hello".
public virtual void TestResize()
CharTermAttribute t = new CharTermAttribute();
char[] content = "hello".ToCharArray();
t.CopyBuffer(content, 0, content.Length);
for (int i = 0; i < 2000; i++)
// NOTE(review): no buffer-resizing call is visible before this assertion in this view;
// presumably one precedes it in the full file — confirm.
Assert.IsTrue(i <= t.Buffer.Length);
// The term text must be unaffected by any change in buffer capacity.
Assert.AreEqual("hello", t.ToString());
// Checks that the attribute's length and text track a StringBuilder as the term grows,
// in three passes: CopyBuffer from a char[], a StringBuilder-based variant, and a slow
// growth pass up to 20000 chars.
// NOTE(review): the statements that grow `buf` (and, in passes 2 and 3, that append to `t`)
// are not visible in this view; the final expected lengths imply them — confirm against the full file.
public virtual void TestGrow()
CharTermAttribute t = new CharTermAttribute();
StringBuilder buf = new StringBuilder("ab");
for (int i = 0; i < 20; i++)
// Replace the whole term with the current builder content and compare length and text.
char[] content = buf.ToString().ToCharArray();
t.CopyBuffer(content, 0, content.Length);
Assert.AreEqual(buf.Length, t.Length);
Assert.AreEqual(buf.ToString(), t.ToString());
// 1048576 == 2^20; presumably reached by doubling the 2-char seed on each pass — TODO confirm.
Assert.AreEqual(1048576, t.Length);
// now as a StringBuilder, first variant
t = new CharTermAttribute();
buf = new StringBuilder("ab");
for (int i = 0; i < 20; i++)
Assert.AreEqual(buf.Length, t.Length);
Assert.AreEqual(buf.ToString(), t.ToString());
Assert.AreEqual(1048576, t.Length);
// Test for slow growth to a long term
t = new CharTermAttribute();
buf = new StringBuilder("a");
for (int i = 0; i < 20000; i++)
Assert.AreEqual(buf.Length, t.Length);
Assert.AreEqual(buf.ToString(), t.ToString());
// One iteration per expected char: the term ends at 20000 chars.
Assert.AreEqual(20000, t.Length);
// Verifies that ToString() returns the current term text, both after CopyBuffer
// and after the term is cleared with SetEmpty() and refilled with Append(string).
public virtual void TestToString()
char[] b = new char[] { 'a', 'l', 'o', 'h', 'a' };
CharTermAttribute t = new CharTermAttribute();
t.CopyBuffer(b, 0, 5);
Assert.AreEqual("aloha", t.ToString());
// SetEmpty() returns the attribute, so the Append call can be chained onto it.
t.SetEmpty().Append("hi there");
Assert.AreEqual("hi there", t.ToString());
// Verifies that a clone carries the same term text as the source attribute
// but does not share the source's buffer array instance.
public virtual void TestClone()
CharTermAttribute t = new CharTermAttribute();
char[] content = "hello".ToCharArray();
t.CopyBuffer(content, 0, 5);
// Capture the source buffer reference so it can be compared with the clone's buffer below.
char[] buf = t.Buffer;
// NOTE(review): TestToken.AssertCloneIsEqual is defined outside this view; presumably it
// clones `t`, asserts equality, and returns the clone — confirm.
CharTermAttribute copy = TestToken.AssertCloneIsEqual(t);
Assert.AreEqual(t.ToString(), copy.ToString());
Assert.AreNotSame(buf, copy.Buffer);
// Builds two attributes holding "hello" (t1a, t1b) and one holding "hello2" (t2).
// NOTE(review): no assertions are visible in this view; presumably the full file compares
// t1a/t1b as equal and each against t2 as unequal — confirm.
public virtual void TestEquals()
CharTermAttribute t1a = new CharTermAttribute();
char[] content1a = "hello".ToCharArray();
t1a.CopyBuffer(content1a, 0, 5);
// Same text as t1a, but built from a separate char[] and a separate attribute instance.
CharTermAttribute t1b = new CharTermAttribute();
char[] content1b = "hello".ToCharArray();
t1b.CopyBuffer(content1b, 0, 5);
// Different text (one extra char).
CharTermAttribute t2 = new CharTermAttribute();
char[] content2 = "hello2".ToCharArray();
t2.CopyBuffer(content2, 0, 6);
// Verifies copying an attribute: first for an empty term, then for "hello", where the
// copy must carry the same text without sharing the source's buffer array instance.
public virtual void TestCopyTo()
CharTermAttribute t = new CharTermAttribute();
// NOTE(review): TestToken.AssertCopyIsEqual is defined outside this view; presumably it
// copies `t` into a new attribute, asserts equality, and returns the copy — confirm.
CharTermAttribute copy = TestToken.AssertCopyIsEqual(t);
// A freshly constructed attribute and its copy both render as the empty string.
Assert.AreEqual("", t.ToString());
Assert.AreEqual("", copy.ToString());
t = new CharTermAttribute();
char[] content = "hello".ToCharArray();
t.CopyBuffer(content, 0, 5);
// Capture the source buffer reference so it can be compared with the copy's buffer below.
char[] buf = t.Buffer;
copy = TestToken.AssertCopyIsEqual(t);
Assert.AreEqual(t.ToString(), copy.ToString());
Assert.AreNotSame(buf, copy.Buffer);
// Checks the attribute's reflected key/value pairs via TestUtil.AssertAttributeReflection:
// "<ICharTermAttribute>#term" -> "foobar" and "<ITermToBytesRefAttribute>#bytes" -> BytesRef("foobar").
// NOTE(review): the statement that puts "foobar" into `t` and the closing of the dictionary
// initializer are not visible in this view — confirm against the full file.
public virtual void TestAttributeReflection()
CharTermAttribute t = new CharTermAttribute();
TestUtil.AssertAttributeReflection(t, new Dictionary<string, object>()
// Keys are built from the interface's simple type name plus a "#<property>" suffix.
{ typeof(ICharTermAttribute).Name + "#term", "foobar" },
{ typeof(ITermToBytesRefAttribute).Name + "#bytes", new BytesRef("foobar") }
// Exercises the char-sequence surface of CharTermAttribute (Length, Subsequence, indexer)
// against the reference string "0123456789".
// NOTE(review): the statement that loads `s` into `t` is not visible in this view; the
// assertions below imply it — confirm against the full file.
public virtual void TestCharSequenceInterface()
const string s = "0123456789";
CharTermAttribute t = new CharTermAttribute();
Assert.AreEqual(s.Length, t.Length);
// Subsequence is called as (startIndex, length); the "end - start" spelling keeps the
// original end index readable in each call.
Assert.AreEqual("12", t.Subsequence(1, 3 - 1).ToString()); // LUCENENET: Corrected 2nd parameter of Subsequence
Assert.AreEqual(s, t.Subsequence(0, s.Length - 0).ToString()); // LUCENENET: Corrected 2nd parameter of Subsequence
// The term text and its slices must also behave as ordinary strings for regex matching.
Assert.IsTrue(Regex.IsMatch(t.ToString(), "01\\d+"));
Assert.IsTrue(Regex.IsMatch(t.Subsequence(3, 5 - 3).ToString(), "34")); // LUCENENET: Corrected 2nd parameter of Subsequence
Assert.AreEqual(s.Substring(3, 4), t.Subsequence(3, 7 - 3).ToString()); // LUCENENET: Corrected 2nd parameter of Subsequence
// Per-character comparison against the reference string.
for (int i = 0; i < s.Length; i++)
Assert.IsTrue(t[i] == s[i]);
// LUCENENET specific to test indexer
for (int i = 0; i < s.Length; i++)
Assert.IsTrue(t[i] == s[i]);
// Exercises the Append overloads of CharTermAttribute (string, char[], ICharSequence,
// StringBuilder, and their start/count forms), then checks that out-of-range arguments
// throw ArgumentOutOfRangeException and that appending null is a no-op.
// NOTE(review): several statements (braces, `try` keywords, and some Append calls) are not
// visible in this view; consecutive assertions with different expected strings imply
// appends that are not shown — confirm against the full file.
public virtual void TestAppendableInterface()
CharTermAttribute t = new CharTermAttribute();
//Formatter formatter = new Formatter(t, Locale.ROOT);
//formatter.format("%d", 1234);
//Assert.AreEqual("1234", t.ToString());
//formatter.format("%d", 5678);
// LUCENENET: We don't have a formatter in .NET, so continue from here
t.Append("12345678"); // LUCENENET specific overload that accepts string
Assert.AreEqual("12345678", t.ToString());
t.SetEmpty().Append("12345678".ToCharArray()); // LUCENENET specific overload that accepts char[]
Assert.AreEqual("12345678", t.ToString());
Assert.AreEqual("123456789", t.ToString());
t.Append(new StringCharSequence("0"));
Assert.AreEqual("1234567890", t.ToString());
// The three-argument overloads are called as (value, startIndex, count); the "end - start"
// spelling keeps the original end index readable.
t.Append(new StringCharSequence("0123456789"), 1, 3 - 1); // LUCENENET: Corrected 3rd parameter
Assert.AreEqual("123456789012", t.ToString());
//t.Append((ICharSequence) CharBuffer.wrap("0123456789".ToCharArray()), 3, 5);
t.Append("0123456789".ToCharArray(), 3, 5 - 3); // LUCENENET: no CharBuffer in .NET, so we test char[], start, end overload // LUCENENET: Corrected 3rd parameter
Assert.AreEqual("12345678901234", t.ToString());
Assert.AreEqual("1234567890123412345678901234", t.ToString());
t.Append(/*(ICharSequence)*/ new StringBuilder("0123456789").ToString(), 5, 7 - 5); // LUCENENET: StringBuilder doesn't implement ICharSequence, corrected 3rd argument
Assert.AreEqual("123456789012341234567890123456", t.ToString());
// Append a StringBuilder built from the term's own text, which doubles the term.
t.Append(/*(ICharSequence)*/ new StringBuilder(t.ToString()));
Assert.AreEqual("123456789012341234567890123456123456789012341234567890123456", t.ToString()); // LUCENENET: StringBuilder doesn't implement ICharSequence
// very weird, to test if a subSlice is wrapped correctly :)
//CharBuffer buf = CharBuffer.wrap("0123456789".ToCharArray(), 3, 5); // LUCENENET: No CharBuffer in .NET
// StringBuilder(value, startIndex, length, capacity): takes the 5 chars starting at index 3.
StringBuilder buf = new StringBuilder("0123456789", 3, 5, 16);
Assert.AreEqual("34567", buf.ToString());
t.SetEmpty().Append(/*(ICharSequence)*/ buf, 1, 2 - 1); // LUCENENET: StringBuilder doesn't implement ICharSequence // LUCENENET: Corrected 3rd parameter
Assert.AreEqual("4", t.ToString());
// NOTE(review): the expected strings below imply that t2 holds "test" and is appended to t;
// those statements are not visible in this view.
ICharTermAttribute t2 = new CharTermAttribute();
Assert.AreEqual("4test", t.ToString());
t.Append((ICharSequence)t2, 1, 2 - 1); // LUCENENET: Corrected 3rd parameter
Assert.AreEqual("4teste", t.ToString());
// ICharSequence overload: a count running past the end, then a negative count, must each throw.
t.Append((ICharSequence)t2, 1, 5 - 1); // LUCENENET: Corrected 3rd parameter
Assert.Fail("Should throw ArgumentOutOfRangeException");
#pragma warning disable 168
catch (System.ArgumentOutOfRangeException iobe)
#pragma warning restore 168
t.Append((ICharSequence)t2, 1, 0 - 1); // LUCENENET: Corrected 3rd parameter
Assert.Fail("Should throw ArgumentOutOfRangeException");
#pragma warning disable 168
catch (System.ArgumentOutOfRangeException iobe)
#pragma warning restore 168
// Appending a null ICharSequence must leave the term unchanged.
string expected = t.ToString();
t.Append((ICharSequence)null); // No-op
Assert.AreEqual(expected, t.ToString());
// LUCENENET specific - test string overloads
t.Append((string)t2.ToString(), 1, 5 - 1); // LUCENENET: Corrected 3rd parameter
Assert.Fail("Should throw ArgumentOutOfRangeException");
#pragma warning disable 168
catch (System.ArgumentOutOfRangeException iobe)
#pragma warning restore 168
t.Append((string)t2.ToString(), 1, 0 - 1); // LUCENENET: Corrected 3rd parameter
Assert.Fail("Should throw ArgumentOutOfRangeException");
#pragma warning disable 168
catch (System.ArgumentOutOfRangeException iobe)
#pragma warning restore 168
// Appending a null string must leave the term unchanged.
expected = t.ToString();
t.Append((string)null); // No-op
Assert.AreEqual(expected, t.ToString());
// LUCENENET specific - test char[] overloads
t.Append((char[])t2.ToString().ToCharArray(), 1, 5 - 1); // LUCENENET: Corrected 3rd parameter
Assert.Fail("Should throw ArgumentOutOfRangeException");
#pragma warning disable 168
catch (System.ArgumentOutOfRangeException iobe)
#pragma warning restore 168
t.Append((char[])t2.ToString().ToCharArray(), 1, 0 - 1); // LUCENENET: Corrected 3rd parameter
Assert.Fail("Should throw ArgumentOutOfRangeException");
#pragma warning disable 168
catch (System.ArgumentOutOfRangeException iobe)
#pragma warning restore 168
// Appending a null char[] must leave the term unchanged.
expected = t.ToString();
t.Append((char[])null); // No-op
Assert.AreEqual(expected, t.ToString());
// Repeats the Append overload checks with longer inputs (a 50-char digit string, a
// 20-char StringBuilder, a 30-char custom ICharSequence).
// NOTE(review): some statements are not visible in this view (for example, the term appears
// to be reset between the string, char[] and ICharSequence sections, judging by the
// expected values) — confirm against the full file.
public virtual void TestAppendableInterfaceWithLongSequences()
CharTermAttribute t = new CharTermAttribute();
t.Append("01234567890123456789012345678901234567890123456789"); // LUCENENET specific overload that accepts string
assertEquals("01234567890123456789012345678901234567890123456789", t.ToString());
// (value, startIndex, count): appends the 47 chars from index 3 to the end of the 50-char input.
t.Append("01234567890123456789012345678901234567890123456789", 3, 50 - 3); // LUCENENET specific overload that accepts string, startIndex, charCount
Assert.AreEqual("0123456789012345678901234567890123456789012345678934567890123456789012345678901234567890123456789", t.ToString());
t.Append("01234567890123456789012345678901234567890123456789".ToCharArray()); // LUCENENET specific overload that accepts char[]
assertEquals("01234567890123456789012345678901234567890123456789", t.ToString());
t.Append("01234567890123456789012345678901234567890123456789".ToCharArray(), 3, 50 - 3); // LUCENENET specific overload that accepts char[], startIndex, charCount
Assert.AreEqual("0123456789012345678901234567890123456789012345678934567890123456789012345678901234567890123456789", t.ToString());
t.Append(new StringCharSequence("01234567890123456789012345678901234567890123456789"));
//t.Append((ICharSequence) CharBuffer.wrap("01234567890123456789012345678901234567890123456789".ToCharArray()), 3, 50); // LUCENENET: No CharBuffer in .NET
t.Append("01234567890123456789012345678901234567890123456789".ToCharArray(), 3, 50 - 3); // LUCENENET specific overload that accepts char[], startIndex, charCount
// "01234567890123456789012345678901234567890123456789"
Assert.AreEqual("0123456789012345678901234567890123456789012345678934567890123456789012345678901234567890123456789", t.ToString());
t.SetEmpty().Append(/*(ICharSequence)*/ new StringBuilder("01234567890123456789"), 5, 17 - 5); // LUCENENET: StringBuilder doesn't implement ICharSequence
Assert.AreEqual(new StringCharSequence("567890123456"), t.ToString());
// Append a StringBuilder built from the term's own text, which doubles the term.
t.Append(new StringBuilder(t.ToString()));
Assert.AreEqual(new StringCharSequence("567890123456567890123456"), t.ToString());
// very weird, to test if a subSlice is wrapped correctly :)
//CharBuffer buf = CharBuffer.wrap("012345678901234567890123456789".ToCharArray(), 3, 15); // LUCENENET: No CharBuffer in .NET
// StringBuilder(value, startIndex, length, capacity): takes the 15 chars starting at index 3.
StringBuilder buf = new StringBuilder("012345678901234567890123456789", 3, 15, 16);
Assert.AreEqual("345678901234567", buf.ToString());
t.SetEmpty().Append(buf, 1, 14 - 1);
Assert.AreEqual("4567890123456", t.ToString());
// finally use a completely custom ICharSequence that is not caught by instanceof checks
const string longTestString = "012345678901234567890123456789";
t.Append(new CharSequenceAnonymousInnerClassHelper(this, longTestString));
Assert.AreEqual("4567890123456" + longTestString, t.ToString());
// Minimal ICharSequence implementation that wraps a string. Every member delegates to the
// wrapped string; the test above appends an instance of it to a CharTermAttribute.
private class CharSequenceAnonymousInnerClassHelper : ICharSequence
// Reference to the enclosing test instance; assigned in the constructor but not read by
// any member visible here.
private readonly TestCharTermAttributeImpl OuterInstance;
// The wrapped text that all members below read from.
private string LongTestString;
public CharSequenceAnonymousInnerClassHelper(TestCharTermAttributeImpl outerInstance, string longTestString)
this.OuterInstance = outerInstance;
this.LongTestString = longTestString;
// True whenever a non-null string is wrapped.
bool ICharSequence.HasValue => LongTestString != null; // LUCENENET specific (implementation of ICharSequence)
// Returns the character at index i of the wrapped string.
public char CharAt(int i)
return LongTestString[i];
// LUCENENET specific - Added to .NETify
public char this[int i]
get { return LongTestString[i]; }
// Number of characters in the wrapped string.
public int Length
return LongTestString.Length;
// Returns `length` chars starting at `startIndex`, wrapped in a StringCharSequence.
public ICharSequence Subsequence(int startIndex, int length) // LUCENENET: Changed semantics to startIndex/length to match .NET
return new StringCharSequence(LongTestString.Substring(startIndex, length));
// Returns the wrapped string itself.
public override string ToString()
return LongTestString;
// Exercises Append with arguments that are not ICharSequence instances (here a
// StringBuilder and, judging by the expected strings, another term attribute).
// NOTE(review): most Append calls are not visible in this view; the expected strings imply
// that "0123456789" is appended twice before the first assertion and that "test" is
// appended via t2 afterwards — confirm against the full file.
public virtual void TestNonCharSequenceAppend()
CharTermAttribute t = new CharTermAttribute();
Assert.AreEqual("01234567890123456789", t.ToString());
t.Append(new StringBuilder("0123456789"));
Assert.AreEqual("012345678901234567890123456789", t.ToString());
ICharTermAttribute t2 = new CharTermAttribute();
Assert.AreEqual("012345678901234567890123456789test", t.ToString());
// Same expected text asserted twice: presumably a no-op append (e.g. of null) sits between
// the two assertions in the full file — TODO confirm.
Assert.AreEqual("012345678901234567890123456789test", t.ToString());
// Verifies that out-of-range access on a 4-char term ("test") throws
// ArgumentOutOfRangeException, both through the indexer and through Subsequence.
// NOTE(review): the statement that loads "test" into `t` and the `try` scaffolding around
// each probe are not visible in this view — confirm against the full file.
public virtual void TestExceptions()
CharTermAttribute t = new CharTermAttribute();
Assert.AreEqual("test", t.ToString());
// Negative index.
var _ = t[-1];
Assert.Fail("Should throw ArgumentOutOfRangeException");
catch (System.ArgumentOutOfRangeException)
// Index equal to the term length (one past the last valid index).
var _ = t[4];
Assert.Fail("Should throw ArgumentOutOfRangeException");
catch (System.ArgumentOutOfRangeException)
// Requested length (5) exceeds the 4 available chars.
t.Subsequence(0, 5 - 0); // LUCENENET: Corrected 2nd parameter of Subsequence
Assert.Fail("Should throw ArgumentOutOfRangeException");
catch (System.ArgumentOutOfRangeException)
// Start index past the end combined with a negative length.
t.Subsequence(5, 0 - 5); // LUCENENET: Corrected 2nd parameter of Subsequence
Assert.Fail("Should throw ArgumentOutOfRangeException");
catch (System.ArgumentOutOfRangeException)
// test speed of the dynamic instanceof checks in append(ICharSequence),
// to find the best max length for the generic while (start<end) loop:
public void testAppendPerf() {
CharTermAttributeImpl t = new CharTermAttributeImpl();
final int count = 32;
ICharSequence[] csq = new ICharSequence[count * 6];
final StringBuilder sb = new StringBuilder();
for (int i=0,j=0; i<count; i++) {
final String testString = sb.toString();
CharTermAttribute cta = new CharTermAttributeImpl();
csq[j++] = cta;
csq[j++] = testString;
csq[j++] = new StringBuilder(sb);
csq[j++] = new StringBuffer(sb);
csq[j++] = CharBuffer.wrap(testString.toCharArray());
csq[j++] = new ICharSequence() {
public char charAt(int i) { return testString.charAt(i); }
public int length() { return testString.length(); }
public ICharSequence subSequence(int start, int end) { return testString.subSequence(start, end); }
public String toString() { return testString; }
Random rnd = newRandom();
long startTime = System.currentTimeMillis();
for (int i=0; i<100000000; i++) {
long endTime = System.currentTimeMillis();
System.out.println("Time: " + (endTime-startTime)/1000.0 + " s");