blob: 9a8dc1f8a9a27e52fcc42905e237f913a0cc27f6 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.apache.datasketches.hll;
import static org.apache.datasketches.hll.CurMode.LIST;
import static org.apache.datasketches.hll.CurMode.SET;
import static org.apache.datasketches.hll.HllUtil.HLL_HIP_RSE_FACTOR;
import static org.apache.datasketches.hll.HllUtil.HLL_NON_HIP_RSE_FACTOR;
import static org.apache.datasketches.hll.TgtHllType.HLL_4;
import static org.apache.datasketches.hll.TgtHllType.HLL_6;
import static org.apache.datasketches.hll.TgtHllType.HLL_8;
import static org.testng.Assert.assertEquals;
import static org.testng.Assert.assertFalse;
import static org.testng.Assert.assertTrue;
import org.apache.datasketches.SketchesStateException;
import org.apache.datasketches.memory.WritableMemory;
import org.testng.annotations.Test;
/**
* @author Lee Rhodes
*/
@SuppressWarnings("javadoc")
public class UnionCaseTest {
private static final String LS = System.getProperty("line.separator");
long v = 0;
final static int maxLgK = 12;
HllSketch source;
//Union union;
String hfmt = "%10s%10s%10s%10s%10s%10s%10s%10s%10s%10s%10s" + LS;
String hdr = String.format(hfmt, "caseNum","srcLgKStr","gdtLgKStr","srcType","gdtType",
"srcMem","gdtMem","srcMode","gdtMode","srcOoof","gdtOoof");
@Test
public void checkAllCases() {
print(hdr);
for (int i = 0; i < 24; i++) {
checkCase(i, HLL_4, false);
}
println("");
print(hdr);
for (int i = 0; i < 24; i++) {
checkCase(i, HLL_6, false);
}
println("");
print(hdr);
for (int i = 0; i < 24; i++) {
checkCase(i, HLL_8, false);
}
println("");
print(hdr);
for (int i = 0; i < 24; i++) {
checkCase(i, HLL_4, true);
}
println("");
print(hdr);
for (int i = 0; i < 24; i++) {
checkCase(i, HLL_6, true);
}
println("");
print(hdr);
for (int i = 0; i < 24; i++) {
checkCase(i, HLL_8, true);
}
println("");
}
private void checkCase(int caseNum, TgtHllType srcType, boolean srcMem) {
source = getSource(caseNum, srcType, srcMem);
boolean gdtMem = (caseNum & 1) > 0;
Union union = getUnion(caseNum, gdtMem);
union.update(source);
int totalU = getSrcCount(caseNum, maxLgK) + getUnionCount(caseNum);
output(caseNum, source, union, totalU);
}
private void output(int caseNum, HllSketch source, Union union, int totalU) {
double estU = union.getEstimate();
double err = Math.abs((estU / totalU) - 1.0);
int gdtLgK = union.getLgConfigK();
boolean uooof = union.isOutOfOrder();
double rseFactor = (uooof) ? HLL_NON_HIP_RSE_FACTOR : HLL_HIP_RSE_FACTOR;
double rse = (rseFactor * 3) / Math.sqrt(1 << gdtLgK); //99.7% conf
//output other parameters
String caseNumStr = Integer.toString(caseNum);
String srcLgKStr = Integer.toString(source.getLgConfigK());
String gdtLgKStr = Integer.toString(union.getLgConfigK());
String srcType = source.getTgtHllType().toString();
String gdtType = union.getTgtHllType().toString();
String srcMem = Boolean.toString(source.isMemory());
String gdtMem = Boolean.toString(union.isMemory());
String srcMode = source.getCurMode().toString();
String gdtMode = union.getCurMode().toString();
String srcOoof = Boolean.toString(source.isOutOfOrder());
String gdtOoof = Boolean.toString(union.isOutOfOrder());
printf(hfmt, caseNumStr, srcLgKStr, gdtLgKStr, srcType, gdtType, srcMem, gdtMem,
srcMode, gdtMode, srcOoof, gdtOoof);
assertTrue(err < rse, "Err: " + err + ", RSE: " + rse);
}
private HllSketch getSource(int caseNum, TgtHllType tgtHllType, boolean memory) {
int srcLgK = getSrcLgK(caseNum, maxLgK);
int srcU = getSrcCount(caseNum, maxLgK);
if (memory) {
return buildMemorySketch(srcLgK, tgtHllType, srcU);
} else {
return buildHeapSketch(srcLgK, tgtHllType, srcU);
}
}
private Union getUnion(int caseNum, boolean memory) {
int unionU = getUnionCount(caseNum);
return (memory) ? buildMemoryUnion(maxLgK, unionU) : buildHeapUnion(maxLgK, unionU);
}
private static int getUnionCount(int caseNum) {
int gdtMode = (caseNum >> 1) & 3; //list, set, hll, empty
return (gdtMode == 0) ? 4 : (gdtMode == 1) ? 380 : (gdtMode == 2) ? 400 : 0;
}
private static int getSrcCount(int caseNum, int maxLgK) {
int srcLgK = getSrcLgK(caseNum, maxLgK);
return (((1 << srcLgK) * 3) / 4) + 100; //always HLL
}
private static int getSrcLgK(int caseNum, int maxLgK) {
int srcLgK = maxLgK;
int bits34 = (caseNum >> 3) & 3;
if (bits34 == 1) { srcLgK = maxLgK - 1;}
if (bits34 == 2) { srcLgK = maxLgK + 1;}
return srcLgK;
}
@Test
public void checkMisc() {
Union u = buildHeapUnion(12, 0);
int bytes = u.getCompactSerializationBytes();
assertEquals(bytes, 8);
bytes = Union.getMaxSerializationBytes(7);
assertEquals(bytes, 40 + 128);
double v = u.getEstimate();
assertEquals(v, 0.0, 0.0);
v = u.getLowerBound(1);
assertEquals(v, 0.0, 0.0);
v = u.getUpperBound(1);
assertEquals(v, 0.0, 0.0);
assertTrue(u.isEmpty());
u.reset();
assertTrue(u.isEmpty());
println(u.toString(true, false, false, false));
byte[] bArr = u.toCompactByteArray();
assertEquals(bArr.length, 8);
}
@Test
public void checkSrcListList() { //src: LIST, gadget: LIST
int n1 = 2;
int n2 = 3;
int n3 = 2;
int sum = n1 + n2 + n3;
Union u = buildHeapUnion(12, n1); //gdt = list
HllSketch h2 = buildHeapSketch(11, HLL_6, n2); //src = list
HllSketch h3 = buildHeapSketch(10, HLL_8, n3); //src = list
u.update(h2);
println(u.toString());
assertEquals(u.getCurMode(), LIST);
u.update(h3);
println(u.toString());
assertEquals(u.getCurMode(), LIST);
assertEquals(u.getLgConfigK(), 12);
assertFalse(u.isOutOfOrder());
double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrder(), 3.0);
println("ErrToll: " + err);
assertEquals(u.getEstimate(), sum, err);
}
@Test
public void checkSrcListSet() { //src: SET, gadget: LIST
int n1 = 5;
int n2 = 2;
int n3 = 16;
int sum = n1 + n2 + n3;
Union u = buildHeapUnion(12, n1); //LIST, 5
HllSketch h2 = buildHeapSketch(11, HLL_6, n2); //LIST, 2
HllSketch h3 = buildHeapSketch(10, HLL_8, n3); //SET, 16
u.update(h2);
println(u.toString());
assertEquals(u.getCurMode(), LIST);
u.update(h3);
println(u.toString());
assertEquals(u.getCurMode(), SET);
assertEquals(u.getLgConfigK(), 12);
assertFalse(u.isOutOfOrder());
double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrder(), 3.0);
println("ErrToll: " + err);
assertEquals(u.getEstimate(), sum, err);
}
@Test
public void checkSrcSetList() { //src: LIST, gadget: SET
int n1 = 6;
int n2 = 10;
int n3 = 6;
int sum = n1 + n2 + n3;
Union u = buildHeapUnion(12, n1);
HllSketch h2 = buildHeapSketch(11, HLL_6, n2); //SET
HllSketch h3 = buildHeapSketch(10, HLL_8, n3); //LIST
u.update(h2);
println(u.toString());
assertEquals(u.getCurMode(), SET);
u.update(h3);
println(u.toString());
assertEquals(u.getCurMode(), SET);
assertEquals(u.getLgConfigK(), 12);
assertFalse(u.isOutOfOrder());
double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrder(), 3.0);
println("ErrToll: " + err);
assertEquals(u.getEstimate(), sum, err);
}
@Test
public void checkSrcSetSet() { //src: SET, gadget: SET
int n1 = 6;
int n2 = 10;
int n3 = 16;
int sum = n1 + n2 + n3;
Union u = buildHeapUnion(12, n1);
HllSketch h2 = buildHeapSketch(11, HLL_6, n2); //src: SET
HllSketch h3 = buildHeapSketch(10, HLL_8, n3); //src: SET
u.update(h2);
println(u.toString());
assertEquals(u.getCurMode(), SET);
u.update(h3);
println(u.toString());
assertEquals(u.getCurMode(), SET);
assertEquals(u.getLgConfigK(), 12);
assertFalse(u.isOutOfOrder());
double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrder(), 3.0);
println("ErrToll: " + err);
assertEquals(u.getEstimate(), sum, err);
}
@Test
public void checkSrcEmptyList() { //src: LIST, gadget: empty
int n1 = 0;
int n2 = 0;
int n3 = 7;
int sum = n1 + n2 + n3;
Union u = buildHeapUnion(12, n1); //LIST empty
HllSketch h2 = buildHeapSketch(11, HLL_6, n2); //src: LIST empty, ignored
HllSketch h3 = buildHeapSketch(10, HLL_8, n3); //src: LIST
u.update(h2);
println(u.toString());
assertEquals(u.getCurMode(), LIST);
u.update(h3);
println(u.toString());
assertEquals(u.getCurMode(), LIST);
assertEquals(u.getLgConfigK(), 12);
assertFalse(u.isOutOfOrder());
double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrder(), 3.0);
println("ErrToll: " + err);
assertEquals(u.getEstimate(), sum, err);
}
@Test
public void checkSrcEmptySet() {
int n1 = 0;
int n2 = 0;
int n3 = 16;
int sum = n1 + n2 + n3;
Union u = buildHeapUnion(12, n1); //LIST empty
HllSketch h2 = buildHeapSketch(11, HLL_6, n2); //LIST empty, ignored
HllSketch h3 = buildHeapSketch(10, HLL_8, n3); // Src Set
u.update(h2);
println(u.toString());
assertEquals(u.getCurMode(), LIST);
u.update(h3);
println(u.toString());
assertEquals(u.getCurMode(), SET);
assertEquals(u.getLgConfigK(), 12);
assertFalse(u.isOutOfOrder());
double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrder(), 3.0);
println("ErrToll: " + err);
assertEquals(u.getEstimate(), sum, err);
}
@SuppressWarnings("unused")
@Test
public void checkSpecialMergeCase4() {
Union u = buildHeapUnion(12, 1 << 9);
HllSketch sk = buildHeapSketch(12, HLL_8, 1 << 9);
u.update(sk);
assertTrue(u.isRebuildCurMinNumKxQFlag());
u.getCompositeEstimate();
assertFalse(u.isRebuildCurMinNumKxQFlag());
u.update(sk);
assertTrue(u.isRebuildCurMinNumKxQFlag());
u.getLowerBound(2);
assertFalse(u.isRebuildCurMinNumKxQFlag());
u.update(sk);
assertTrue(u.isRebuildCurMinNumKxQFlag());
u.getUpperBound(2);
assertFalse(u.isRebuildCurMinNumKxQFlag());
u.update(sk);
assertTrue(u.isRebuildCurMinNumKxQFlag());
u.getResult();
assertFalse(u.isRebuildCurMinNumKxQFlag());
u.update(sk);
assertTrue(u.isRebuildCurMinNumKxQFlag());
byte[] ba = u.toCompactByteArray();
assertFalse(u.isRebuildCurMinNumKxQFlag());
u.update(sk);
assertTrue(u.isRebuildCurMinNumKxQFlag());
ba = u.toUpdatableByteArray();
assertFalse(u.isRebuildCurMinNumKxQFlag());
u.putRebuildCurMinNumKxQFlag(true);
assertTrue(u.isRebuildCurMinNumKxQFlag());
u.putRebuildCurMinNumKxQFlag(false);
assertFalse(u.isRebuildCurMinNumKxQFlag());
}
@Test
public void checkRebuildCurMinNumKxQFlag1() {
HllSketch sk = buildHeapSketch(4, HLL_8, 16);
HllArray hllArr = (HllArray)(sk.hllSketchImpl);
hllArr.putRebuildCurMinNumKxQFlag(true); //corrupt the flag
Union union = buildHeapUnion(4, 0);
union.update(sk);
}
@Test
public void checkRebuildCurMinNumKxQFlag2() {
HllSketch sk = buildMemorySketch(4, HLL_8, 16);
DirectHllArray hllArr = (DirectHllArray)(sk.hllSketchImpl);
hllArr.putRebuildCurMinNumKxQFlag(true); //corrupt the flag
WritableMemory wmem = sk.getWritableMemory();
Union.writableWrap(wmem);
}
@Test(expectedExceptions = SketchesStateException.class)
public void checkHllMergeToException() {
HllSketch src = buildHeapSketch(4, HLL_8, 16);
HllSketch tgt = buildHeapSketch(4, HLL_8, 16);
AbstractHllArray absHllArr = (AbstractHllArray)(src.hllSketchImpl);
absHllArr.mergeTo(tgt);
}
private static double errorFactor(int lgK, boolean oooFlag, double numStdDev) {
double f;
if (oooFlag) {
f = (1.04 * numStdDev) / Math.sqrt(1 << lgK);
} else {
f = (0.9 * numStdDev) / Math.sqrt(1 << lgK);
}
return f;
}
//BUILDERS
private Union buildHeapUnion(int lgMaxK, int n) {
Union u = new Union(lgMaxK);
for (int i = 0; i < n; i++) { u.update(i + v); }
v += n;
return u;
}
private Union buildMemoryUnion(int lgMaxK, int n) {
final int bytes = HllSketch.getMaxUpdatableSerializationBytes(lgMaxK, TgtHllType.HLL_8);
WritableMemory wmem = WritableMemory.allocate(bytes);
Union u = new Union(lgMaxK, wmem);
for (int i = 0; i < n; i++) { u.update(i + v); }
v += n;
return u;
}
private HllSketch buildHeapSketch(int lgK, TgtHllType tgtHllType, int n) {
HllSketch sk = new HllSketch(lgK, tgtHllType);
for (int i = 0; i < n; i++) { sk.update(i + v); }
v += n;
return sk;
}
private HllSketch buildMemorySketch(int lgK, TgtHllType tgtHllType, int n) {
final int bytes = HllSketch.getMaxUpdatableSerializationBytes(lgK,tgtHllType);
WritableMemory wmem = WritableMemory.allocate(bytes);
HllSketch sk = new HllSketch(lgK, tgtHllType, wmem);
for (int i = 0; i < n; i++) { sk.update(i + v); }
v += n;
return sk;
}
@Test
public void printlnTest() {
println("PRINTING: "+this.getClass().getName());
}
/**
* @param o value to print
*/
static void println(Object o) {
print(o.toString() + "\n");
}
/**
* @param o value to print
*/
static void print(Object o) {
//System.out.print(o.toString()); //disable here
}
/**
* @param fmt format
* @param args arguments
*/
static void printf(String fmt, Object...args) {
//System.out.printf(fmt, args); //disable here
}
}