ICU-8167 port BytesTrieTest to Java

X-SVN-Rev: 29279
This commit is contained in:
Markus Scherer 2011-01-10 21:23:38 +00:00
parent 4737659651
commit 045c005304
4 changed files with 762 additions and 6 deletions

View File

@ -384,7 +384,7 @@ public final class BytesTrie implements Cloneable, Iterable<BytesTrie.Entry> {
* @return A new BytesTrie.Iterator.
*/
public static Iterator iterator(byte[] trieBytes, int offset, int maxStringLength) {
return new Iterator(trieBytes, offset, -1, 0);
return new Iterator(trieBytes, offset, -1, maxStringLength);
}
/**
@ -395,12 +395,12 @@ public final class BytesTrie implements Cloneable, Iterable<BytesTrie.Entry> {
bytes=new byte[capacity];
}
public int stringLength() { return length; }
public int bytesLength() { return length; }
public byte byteAt(int index) { return bytes[index]; }
public void copyStringTo(byte[] dest, int destOffset) {
public void copyBytesTo(byte[] dest, int destOffset) {
System.arraycopy(bytes, 0, dest, destOffset, length);
}
public ByteBuffer stringAsByteBuffer() {
public ByteBuffer bytesAsByteBuffer() {
return ByteBuffer.wrap(bytes, 0, length).asReadOnlyBuffer();
}
@ -410,6 +410,7 @@ public final class BytesTrie implements Cloneable, Iterable<BytesTrie.Entry> {
if(bytes.length<len) {
byte[] newBytes=new byte[Math.min(2*bytes.length, 2*len)];
System.arraycopy(bytes, 0, newBytes, 0, length);
bytes=newBytes;
}
}
private void append(byte b) {

View File

@ -5,7 +5,7 @@
*******************************************************************************
* created on: 2011jan05
* created by: Markus W. Scherer
* ported from ICU4C bytestriebuilder/.cpp
* ported from ICU4C bytestriebuilder.h/.cpp
*/
package com.ibm.icu.impl;

View File

@ -5,7 +5,7 @@
*******************************************************************************
* created on: 2011jan05
* created by: Markus W. Scherer
* ported from ICU4C stringtriebuilder/.cpp
* ported from ICU4C stringtriebuilder.h/.cpp
*/
package com.ibm.icu.impl;
@ -26,6 +26,7 @@ public abstract class StringTrieBuilder {
protected final void createCompactBuilder(int sizeGuess) {
nodes=new HashMap<Node, Node>(sizeGuess);
lookupFinalValueNode=new FinalValueNode(0);
}
protected final void deleteCompactBuilder() {
nodes=null;

View File

@ -0,0 +1,754 @@
/*
*******************************************************************************
* Copyright (C) 2011, International Business Machines
* Corporation and others. All Rights Reserved.
*******************************************************************************
* created on: 2011jan08
* created by: Markus W. Scherer
* ported from ICU4C bytestrietest.h/.cpp
*/
package com.ibm.icu.dev.test.util;
import java.nio.ByteBuffer;
import java.util.NoSuchElementException;
import com.ibm.icu.dev.test.TestFmwk;
import com.ibm.icu.impl.BytesTrie;
import com.ibm.icu.impl.BytesTrieBuilder;
import com.ibm.icu.impl.StringTrieBuilder;
public class BytesTrieTest extends TestFmwk {
public static void main(String[] args) throws Exception {
new BytesTrieTest().run(args);
}
public BytesTrieTest() {}
// All test functions have a TestNN prefix where NN is a double-digit number.
// This is so that when tests are run in sorted order
// the simpler ones are run first.
// If there is a problem, the simpler ones are easier to step through.
public void Test00Builder() {
BytesTrieBuilder builder=new BytesTrieBuilder();
try {
builder.build(StringTrieBuilder.Option.FAST);
errln("BytesTrieBuilder().build() did not throw IndexOutOfBoundsException");
return;
} catch(IndexOutOfBoundsException e) {
// good
}
try {
byte[] equal=new byte[] { 0x3d }; // "="
builder.add(equal, 0, 0).add(equal, 0, 1).build(StringTrieBuilder.Option.FAST);
errln("BytesTrieBuilder.build() did not detect duplicates");
return;
} catch(IllegalArgumentException e) {
// good
}
}
private static final class StringAndValue {
public StringAndValue(String str, int val) {
s=str;
bytes=new byte[s.length()];
for(int i=0; i<bytes.length; ++i) {
bytes[i]=(byte)s.charAt(i);
}
value=val;
}
public String s;
public byte[] bytes;
public int value;
}
// Note: C++ StringAndValue initializers converted to Java syntax
// with Eclipse Find/Replace regular expressions:
// Find: \{ (".*", [-0-9xa-fA-F]+) \}
// Replace with: new StringAndValue($1)
public void Test10Empty() {
final StringAndValue[] data={
new StringAndValue("", 0)
};
checkData(data);
}
public void Test11_a() {
final StringAndValue[] data={
new StringAndValue("a", 1)
};
checkData(data);
}
public void Test12_a_ab() {
final StringAndValue[] data={
new StringAndValue("a", 1),
new StringAndValue("ab", 100)
};
checkData(data);
}
public void Test20ShortestBranch() {
final StringAndValue[] data={
new StringAndValue("a", 1000),
new StringAndValue("b", 2000)
};
checkData(data);
}
public void Test21Branches() {
final StringAndValue[] data={
new StringAndValue("a", 0x10),
new StringAndValue("cc", 0x40),
new StringAndValue("e", 0x100),
new StringAndValue("ggg", 0x400),
new StringAndValue("i", 0x1000),
new StringAndValue("kkkk", 0x4000),
new StringAndValue("n", 0x10000),
new StringAndValue("ppppp", 0x40000),
new StringAndValue("r", 0x100000),
new StringAndValue("sss", 0x200000),
new StringAndValue("t", 0x400000),
new StringAndValue("uu", 0x800000),
new StringAndValue("vv", 0x7fffffff),
new StringAndValue("zz", 0x80000000)
};
for(int length=2; length<=data.length; ++length) {
logln("TestBranches length="+length);
checkData(data, length);
}
}
public void Test22LongSequence() {
final StringAndValue[] data={
new StringAndValue("a", -1),
// sequence of linear-match nodes
new StringAndValue("abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ", -2),
// more than 256 bytes
new StringAndValue(
"abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ"+
"abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ"+
"abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ"+
"abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ"+
"abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ"+
"abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ", -3)
};
checkData(data);
}
public void Test23LongBranch() {
// Split-branch and interesting compact-integer values.
final StringAndValue[] data={
new StringAndValue("a", -2),
new StringAndValue("b", -1),
new StringAndValue("c", 0),
new StringAndValue("d2", 1),
new StringAndValue("f", 0x3f),
new StringAndValue("g", 0x40),
new StringAndValue("h", 0x41),
new StringAndValue("j23", 0x1900),
new StringAndValue("j24", 0x19ff),
new StringAndValue("j25", 0x1a00),
new StringAndValue("k2", 0x1a80),
new StringAndValue("k3", 0x1aff),
new StringAndValue("l234567890", 0x1b00),
new StringAndValue("l234567890123", 0x1b01),
new StringAndValue("nnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnnn", 0x10ffff),
new StringAndValue("oooooooooooooooooooooooooooooooooooooooooooooooooooooo", 0x110000),
new StringAndValue("pppppppppppppppppppppppppppppppppppppppppppppppppppppp", 0x120000),
new StringAndValue("r", 0x333333),
new StringAndValue("s2345", 0x4444444),
new StringAndValue("t234567890", 0x77777777),
new StringAndValue("z", 0x80000001)
};
checkData(data);
}
public void Test24ValuesForState() {
// Check that saveState() and resetToState() interact properly
// with next() and current().
final StringAndValue[] data={
new StringAndValue("a", -1),
new StringAndValue("ab", -2),
new StringAndValue("abc", -3),
new StringAndValue("abcd", -4),
new StringAndValue("abcde", -5),
new StringAndValue("abcdef", -6)
};
checkData(data);
}
public void Test30Compact() {
// Duplicate trailing strings and values provide opportunities for compacting.
final StringAndValue[] data={
new StringAndValue("+", 0),
new StringAndValue("+august", 8),
new StringAndValue("+december", 12),
new StringAndValue("+july", 7),
new StringAndValue("+june", 6),
new StringAndValue("+november", 11),
new StringAndValue("+october", 10),
new StringAndValue("+september", 9),
new StringAndValue("-", 0),
new StringAndValue("-august", 8),
new StringAndValue("-december", 12),
new StringAndValue("-july", 7),
new StringAndValue("-june", 6),
new StringAndValue("-november", 11),
new StringAndValue("-october", 10),
new StringAndValue("-september", 9),
// The l+n branch (with its sub-nodes) is a duplicate but will be written
// both times because each time it follows a different linear-match node.
new StringAndValue("xjuly", 7),
new StringAndValue("xjune", 6)
};
checkData(data);
}
public byte[] buildMonthsTrie(BytesTrieBuilder builder, StringTrieBuilder.Option buildOption) {
// All types of nodes leading to the same value,
// for code coverage of recursive functions.
// In particular, we need a lot of branches on some single level
// to exercise a split-branch node.
final StringAndValue[] data={
new StringAndValue("august", 8),
new StringAndValue("jan", 1),
new StringAndValue("jan.", 1),
new StringAndValue("jana", 1),
new StringAndValue("janbb", 1),
new StringAndValue("janc", 1),
new StringAndValue("janddd", 1),
new StringAndValue("janee", 1),
new StringAndValue("janef", 1),
new StringAndValue("janf", 1),
new StringAndValue("jangg", 1),
new StringAndValue("janh", 1),
new StringAndValue("janiiii", 1),
new StringAndValue("janj", 1),
new StringAndValue("jankk", 1),
new StringAndValue("jankl", 1),
new StringAndValue("jankmm", 1),
new StringAndValue("janl", 1),
new StringAndValue("janm", 1),
new StringAndValue("jannnnnnnnnnnnnnnnnnnnnnnnnnnnn", 1),
new StringAndValue("jano", 1),
new StringAndValue("janpp", 1),
new StringAndValue("janqqq", 1),
new StringAndValue("janr", 1),
new StringAndValue("januar", 1),
new StringAndValue("january", 1),
new StringAndValue("july", 7),
new StringAndValue("jun", 6),
new StringAndValue("jun.", 6),
new StringAndValue("june", 6)
};
return buildTrie(data, data.length, builder, buildOption);
}
public void Test40GetUniqueValue() {
BytesTrieBuilder builder=new BytesTrieBuilder();
byte[] trieBytes=buildMonthsTrie(builder, StringTrieBuilder.Option.FAST);
BytesTrie trie=new BytesTrie(trieBytes, 0);
long uniqueValue;
if((uniqueValue=trie.getUniqueValue())!=0) {
errln("unique value at root");
}
trie.next('j');
trie.next('a');
trie.next('n');
// hasUniqueValue() directly after next()
if((uniqueValue=trie.getUniqueValue())!=((1<<1)|1)) {
errln("not unique value 1 after \"jan\": instead "+uniqueValue);
}
trie.first('j');
trie.next('u');
if((uniqueValue=trie.getUniqueValue())!=0) {
errln("unique value after \"ju\"");
}
if(trie.next('n')!=BytesTrie.Result.INTERMEDIATE_VALUE || 6!=trie.getValue()) {
errln("not normal value 6 after \"jun\"");
}
// hasUniqueValue() after getValue()
if((uniqueValue=trie.getUniqueValue())!=((6<<1)|1)) {
errln("not unique value 6 after \"jun\"");
}
// hasUniqueValue() from within a linear-match node
trie.first('a');
trie.next('u');
if((uniqueValue=trie.getUniqueValue())!=((8<<1)|1)) {
errln("not unique value 8 after \"au\"");
}
}
public void Test41GetNextBytes() {
BytesTrieBuilder builder=new BytesTrieBuilder();
byte[] trieBytes=buildMonthsTrie(builder, StringTrieBuilder.Option.SMALL);
BytesTrie trie=new BytesTrie(trieBytes, 0);
StringBuilder buffer=new StringBuilder();
int count=trie.getNextBytes(buffer);
if(count!=2 || !"aj".contentEquals(buffer)) {
errln("months getNextBytes()!=[aj] at root");
}
trie.next('j');
trie.next('a');
trie.next('n');
// getNextBytes() directly after next()
buffer.setLength(0);
count=trie.getNextBytes(buffer);
if(count!=20 || !".abcdefghijklmnopqru".contentEquals(buffer)) {
errln("months getNextBytes()!=[.abcdefghijklmnopqru] after \"jan\"");
}
// getNextBytes() after getValue()
trie.getValue(); // next() had returned BytesTrie.Result.INTERMEDIATE_VALUE.
buffer.setLength(0);
count=trie.getNextBytes(buffer);
if(count!=20 || !".abcdefghijklmnopqru".contentEquals(buffer)) {
errln("months getNextBytes()!=[.abcdefghijklmnopqru] after \"jan\"+getValue()");
}
// getNextBytes() from a linear-match node
trie.next('u');
buffer.setLength(0);
count=trie.getNextBytes(buffer);
if(count!=1 || !"a".contentEquals(buffer)) {
errln("months getNextBytes()!=[a] after \"janu\"");
}
trie.next('a');
buffer.setLength(0);
count=trie.getNextBytes(buffer);
if(count!=1 || !"r".contentEquals(buffer)) {
errln("months getNextBytes()!=[r] after \"janua\"");
}
trie.next('r');
trie.next('y');
// getNextBytes() after a final match
buffer.setLength(0);
count=trie.getNextBytes(buffer);
if(count!=0 || buffer.length()!=0) {
errln("months getNextBytes()!=[] after \"january\"");
}
}
public void Test50IteratorFromBranch() {
BytesTrieBuilder builder=new BytesTrieBuilder();
byte[] trieBytes=buildMonthsTrie(builder, StringTrieBuilder.Option.FAST);
BytesTrie trie=new BytesTrie(trieBytes, 0);
// Go to a branch node.
trie.next('j');
trie.next('a');
trie.next('n');
BytesTrie.Iterator iter=trie.iterator();
// Expected data: Same as in buildMonthsTrie(), except only the suffixes
// following "jan".
final StringAndValue[] data={
new StringAndValue("", 1),
new StringAndValue(".", 1),
new StringAndValue("a", 1),
new StringAndValue("bb", 1),
new StringAndValue("c", 1),
new StringAndValue("ddd", 1),
new StringAndValue("ee", 1),
new StringAndValue("ef", 1),
new StringAndValue("f", 1),
new StringAndValue("gg", 1),
new StringAndValue("h", 1),
new StringAndValue("iiii", 1),
new StringAndValue("j", 1),
new StringAndValue("kk", 1),
new StringAndValue("kl", 1),
new StringAndValue("kmm", 1),
new StringAndValue("l", 1),
new StringAndValue("m", 1),
new StringAndValue("nnnnnnnnnnnnnnnnnnnnnnnnnnnn", 1),
new StringAndValue("o", 1),
new StringAndValue("pp", 1),
new StringAndValue("qqq", 1),
new StringAndValue("r", 1),
new StringAndValue("uar", 1),
new StringAndValue("uary", 1)
};
checkIterator(iter, data);
// Reset, and we should get the same result.
logln("after iter.reset()");
checkIterator(iter.reset(), data);
}
public void Test51IteratorFromLinearMatch() {
BytesTrieBuilder builder=new BytesTrieBuilder();
byte[] trieBytes=buildMonthsTrie(builder, StringTrieBuilder.Option.SMALL);
BytesTrie trie=new BytesTrie(trieBytes, 0);
// Go into a linear-match node.
trie.next('j');
trie.next('a');
trie.next('n');
trie.next('u');
trie.next('a');
BytesTrie.Iterator iter=trie.iterator();
// Expected data: Same as in buildMonthsTrie(), except only the suffixes
// following "janua".
final StringAndValue[] data={
new StringAndValue("r", 1),
new StringAndValue("ry", 1)
};
checkIterator(iter, data);
// Reset, and we should get the same result.
logln("after iter.reset()");
checkIterator(iter.reset(), data);
}
public void Test52TruncatingIteratorFromRoot() {
BytesTrieBuilder builder=new BytesTrieBuilder();
byte[] trieBytes=buildMonthsTrie(builder, StringTrieBuilder.Option.FAST);
BytesTrie.Iterator iter=BytesTrie.iterator(trieBytes, 0, 4);
// Expected data: Same as in buildMonthsTrie(), except only the first 4 characters
// of each string, and no string duplicates from the truncation.
final StringAndValue[] data={
new StringAndValue("augu", -1),
new StringAndValue("jan", 1),
new StringAndValue("jan.", 1),
new StringAndValue("jana", 1),
new StringAndValue("janb", -1),
new StringAndValue("janc", 1),
new StringAndValue("jand", -1),
new StringAndValue("jane", -1),
new StringAndValue("janf", 1),
new StringAndValue("jang", -1),
new StringAndValue("janh", 1),
new StringAndValue("jani", -1),
new StringAndValue("janj", 1),
new StringAndValue("jank", -1),
new StringAndValue("janl", 1),
new StringAndValue("janm", 1),
new StringAndValue("jann", -1),
new StringAndValue("jano", 1),
new StringAndValue("janp", -1),
new StringAndValue("janq", -1),
new StringAndValue("janr", 1),
new StringAndValue("janu", -1),
new StringAndValue("july", 7),
new StringAndValue("jun", 6),
new StringAndValue("jun.", 6),
new StringAndValue("june", 6)
};
checkIterator(iter, data);
// Reset, and we should get the same result.
logln("after iter.reset()");
checkIterator(iter.reset(), data);
}
public void Test53TruncatingIteratorFromLinearMatchShort() {
final StringAndValue[] data={
new StringAndValue("abcdef", 10),
new StringAndValue("abcdepq", 200),
new StringAndValue("abcdeyz", 3000)
};
BytesTrieBuilder builder=new BytesTrieBuilder();
byte[] trieBytes=buildTrie(data, data.length, builder, StringTrieBuilder.Option.FAST);
BytesTrie trie=new BytesTrie(trieBytes, 0);
// Go into a linear-match node.
trie.next('a');
trie.next('b');
// Truncate within the linear-match node.
BytesTrie.Iterator iter=trie.iterator(2);
final StringAndValue[] expected={
new StringAndValue("cd", -1)
};
checkIterator(iter, expected);
// Reset, and we should get the same result.
logln("after iter.reset()");
checkIterator(iter.reset(), expected);
}
public void Test54TruncatingIteratorFromLinearMatchLong() {
final StringAndValue[] data={
new StringAndValue("abcdef", 10),
new StringAndValue("abcdepq", 200),
new StringAndValue("abcdeyz", 3000)
};
BytesTrieBuilder builder=new BytesTrieBuilder();
byte[] trieBytes=buildTrie(data, data.length, builder, StringTrieBuilder.Option.FAST);
BytesTrie trie=new BytesTrie(trieBytes, 0);
// Go into a linear-match node.
trie.next('a');
trie.next('b');
trie.next('c');
// Truncate after the linear-match node.
BytesTrie.Iterator iter=trie.iterator(3);
final StringAndValue[] expected={
new StringAndValue("def", 10),
new StringAndValue("dep", -1),
new StringAndValue("dey", -1)
};
checkIterator(iter, expected);
// Reset, and we should get the same result.
logln("after iter.reset()");
checkIterator(iter.reset(), expected);
}
private void checkData(StringAndValue data[]) {
checkData(data, data.length);
}
private void checkData(StringAndValue data[], int dataLength) {
logln("checkData(dataLength="+dataLength+", fast)");
checkData(data, dataLength, StringTrieBuilder.Option.FAST);
logln("checkData(dataLength="+dataLength+", small)");
checkData(data, dataLength, StringTrieBuilder.Option.SMALL);
}
private void checkData(StringAndValue data[], int dataLength, StringTrieBuilder.Option buildOption) {
BytesTrieBuilder builder=new BytesTrieBuilder();
byte[] trieBytes=buildTrie(data, dataLength, builder, buildOption);
checkFirst(trieBytes, data, dataLength);
checkNext(trieBytes, data, dataLength);
checkNextWithState(trieBytes, data, dataLength);
checkNextString(trieBytes, data, dataLength);
checkIterator(trieBytes, data, dataLength);
}
private byte[] buildTrie(StringAndValue data[], int dataLength,
BytesTrieBuilder builder, StringTrieBuilder.Option buildOption) {
// Add the items to the trie builder in an interesting (not trivial, not random) order.
int index, step;
if((dataLength&1)!=0) {
// Odd number of items.
index=dataLength/2;
step=2;
} else if((dataLength%3)!=0) {
// Not a multiple of 3.
index=dataLength/5;
step=3;
} else {
index=dataLength-1;
step=-1;
}
builder.clear();
for(int i=0; i<dataLength; ++i) {
builder.add(data[index].bytes, data[index].bytes.length, data[index].value);
index=(index+step)%dataLength;
}
ByteBuffer result=builder.build(buildOption);
try {
builder.add(/* "zzz" */ new byte[] { 0x7a, 0x7a, 0x7a }, 0, 999);
errln("builder.build().add(zzz) did not throw IllegalStateException");
} catch(IllegalStateException e) {
// good
}
logln("serialized trie size: "+result.remaining()+" bytes\n");
byte[] trieBytes=new byte[result.remaining()];
result.get(trieBytes);
return trieBytes;
}
private void checkFirst(byte[] trieBytes, StringAndValue data[], int dataLength) {
BytesTrie trie=new BytesTrie(trieBytes, 0);
for(int i=0; i<dataLength; ++i) {
if(data[i].s.isEmpty()) {
continue; // skip empty string
}
int c=data[i].s.charAt(0);
BytesTrie.Result firstResult=trie.first(c);
int firstValue=firstResult.hasValue() ? trie.getValue() : -1;
int c1= data[i].s.length()>1 ? data[i].s.charAt(1) : 0;
BytesTrie.Result nextResult=trie.next(c1);
if(firstResult!=trie.reset().next(c) ||
firstResult!=trie.current() ||
firstValue!=(firstResult.hasValue() ? trie.getValue() : -1) ||
nextResult!=trie.next(c1)
) {
errln(String.format("trie.first(%c)!=trie.reset().next(same) for %s",
c, data[i].s));
}
}
}
private void checkNext(byte[] trieBytes, StringAndValue data[], int dataLength) {
BytesTrie trie=new BytesTrie(trieBytes, 0);
BytesTrie.State state=new BytesTrie.State();
for(int i=0; i<dataLength; ++i) {
int stringLength=data[i].s.length();
BytesTrie.Result result;
if( !(result=trie.next(data[i].bytes, 0, stringLength)).hasValue() ||
result!=trie.current()
) {
errln("trie does not seem to contain "+data[i].s);
} else if(trie.getValue()!=data[i].value) {
errln(String.format("trie value for %s is %d=0x%x instead of expected %d=0x%x",
data[i].s,
trie.getValue(), trie.getValue(),
data[i].value, data[i].value));
} else if(result!=trie.current() || trie.getValue()!=data[i].value) {
errln("trie value for "+data[i].s+" changes when repeating current()/getValue()");
}
trie.reset();
result=trie.current();
for(int j=0; j<stringLength; ++j) {
if(!result.hasNext()) {
errln(String.format("trie.current()!=hasNext before end of %s (at index %d)",
data[i].s, j));
break;
}
if(result==BytesTrie.Result.INTERMEDIATE_VALUE) {
trie.getValue();
if(trie.current()!=BytesTrie.Result.INTERMEDIATE_VALUE) {
errln(String.format("trie.getValue().current()!=BytesTrie.Result.INTERMEDIATE_VALUE "+
"before end of %s (at index %d)", data[i].s, j));
break;
}
}
result=trie.next(data[i].s.charAt(j));
if(!result.matches()) {
errln(String.format("trie.next()=BytesTrie.Result.NO_MATCH "+
"before end of %s (at index %d)", data[i].s, j));
break;
}
if(result!=trie.current()) {
errln(String.format("trie.next()!=following current() "+
"before end of %s (at index %d)", data[i].s, j));
break;
}
}
if(!result.hasValue()) {
errln("trie.next()!=hasValue at the end of "+data[i].s);
continue;
}
trie.getValue();
if(result!=trie.current()) {
errln("trie.current() != current()+getValue()+current() after end of "+
data[i].s);
}
// Compare the final current() with whether next() can actually continue.
trie.saveState(state);
boolean nextContinues=false;
for(int c=0x20; c<0x7f; ++c) {
if(trie.resetToState(state).next(c).matches()) {
nextContinues=true;
break;
}
}
if((result==BytesTrie.Result.INTERMEDIATE_VALUE)!=nextContinues) {
errln("(trie.current()==BytesTrie.Result.INTERMEDIATE_VALUE) contradicts "+
"(trie.next(some UChar)!=BytesTrie.Result.NO_MATCH) after end of "+data[i].s);
}
trie.reset();
}
}
private void checkNextWithState(byte[] trieBytes, StringAndValue data[], int dataLength) {
BytesTrie trie=new BytesTrie(trieBytes, 0);
BytesTrie.State noState=new BytesTrie.State(), state=new BytesTrie.State();
for(int i=0; i<dataLength; ++i) {
if((i&1)==0) {
try {
trie.resetToState(noState);
errln("trie.resetToState(noState) should throw an IllegalArgumentException");
} catch(IllegalArgumentException e) {
// good
}
}
byte[] expectedString=data[i].bytes;
int stringLength=data[i].s.length();
int partialLength=stringLength/3;
for(int j=0; j<partialLength; ++j) {
if(!trie.next(expectedString[j]).matches()) {
errln("trie.next()=BytesTrie.Result.NO_MATCH for a prefix of "+data[i].s);
return;
}
}
trie.saveState(state);
BytesTrie.Result resultAtState=trie.current();
BytesTrie.Result result;
int valueAtState=-99;
if(resultAtState.hasValue()) {
valueAtState=trie.getValue();
}
result=trie.next(0); // mismatch
if(result!=BytesTrie.Result.NO_MATCH || result!=trie.current()) {
errln("trie.next(0) matched after part of "+data[i].s);
}
if( resultAtState!=trie.resetToState(state).current() ||
(resultAtState.hasValue() && valueAtState!=trie.getValue())
) {
errln("trie.next(part of "+data[i].s+") changes current()/getValue() after "+
"saveState/next(0)/resetToState");
} else if(!(result=trie.next(expectedString, partialLength, stringLength)).hasValue() ||
result!=trie.current()) {
errln("trie.next(rest of "+data[i].s+") does not seem to contain "+data[i].s+" after "+
"saveState/next(0)/resetToState");
} else if(!(result=trie.resetToState(state).
next(expectedString, partialLength, stringLength)).hasValue() ||
result!=trie.current()) {
errln("trie does not seem to contain "+data[i].s+
" after saveState/next(rest)/resetToState");
} else if(trie.getValue()!=data[i].value) {
errln(String.format("trie value for %s is %d=0x%x instead of expected %d=0x%x",
data[i].s,
trie.getValue(), trie.getValue(),
data[i].value, data[i].value));
}
trie.reset();
}
}
// next(string) is also tested in other functions,
// but here we try to go partway through the string, and then beyond it.
private void checkNextString(byte[] trieBytes, StringAndValue data[], int dataLength) {
BytesTrie trie=new BytesTrie(trieBytes, 0);
for(int i=0; i<dataLength; ++i) {
byte[] expectedString=data[i].bytes;
int stringLength=data[i].s.length();
if(!trie.next(expectedString, 0, stringLength/2).matches()) {
errln("trie.next(up to middle of string)=BytesTrie.Result.NO_MATCH for "+data[i].s);
continue;
}
// Test that we stop properly at the end of the string.
trie.next(expectedString, stringLength/2, stringLength);
if(trie.next(0).matches()) {
errln("trie.next(string+NUL)!=BytesTrie.Result.NO_MATCH for "+data[i].s);
}
trie.reset();
}
}
private void checkIterator(byte[] trieBytes, StringAndValue data[], int dataLength) {
BytesTrie.Iterator iter=BytesTrie.iterator(trieBytes, 0, 0);
checkIterator(iter, data, dataLength);
}
private void checkIterator(BytesTrie.Iterator iter, StringAndValue data[]) {
checkIterator(iter, data, data.length);
}
private void checkIterator(BytesTrie.Iterator iter, StringAndValue data[], int dataLength) {
for(int i=0; i<dataLength; ++i) {
if(!iter.hasNext()) {
errln("trie iterator hasNext()=false for item "+i+": "+data[i].s);
break;
}
BytesTrie.Entry entry=iter.next();
StringBuilder bytesString=new StringBuilder();
for(int j=0; j<entry.bytesLength(); ++j) {
bytesString.append((char)(entry.byteAt(j)&0xff));
}
if(!data[i].s.contentEquals(bytesString)) {
errln(String.format("trie iterator next().getString()=%s but expected %s for item %d",
bytesString, data[i].s, i));
}
if(entry.value!=data[i].value) {
errln(String.format("trie iterator next().getValue()=%d=0x%x but expected %d=0x%x for item %d: %s",
entry.value, entry.value,
data[i].value, data[i].value,
i, data[i].s));
}
}
if(iter.hasNext()) {
errln("trie iterator hasNext()=true after all items");
}
try {
iter.next();
errln("trie iterator next() did not throw NoSuchElementException after all items");
} catch(NoSuchElementException e) {
// good
}
}
}