| /* |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, |
| * software distributed under the License is distributed on an |
| * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| * KIND, either express or implied. See the License for the |
| * specific language governing permissions and limitations |
| * under the License. |
| */ |
| |
| package org.apache.datasketches.hll; |
| |
| import static org.apache.datasketches.hll.CurMode.HLL; |
| import static org.apache.datasketches.hll.CurMode.LIST; |
| import static org.apache.datasketches.hll.CurMode.SET; |
| import static org.apache.datasketches.hll.TgtHllType.HLL_4; |
| import static org.apache.datasketches.hll.TgtHllType.HLL_6; |
| import static org.apache.datasketches.hll.TgtHllType.HLL_8; |
| import static org.testng.Assert.assertEquals; |
| import static org.testng.Assert.assertFalse; |
| import static org.testng.Assert.assertTrue; |
| |
| import org.testng.annotations.Test; |
| |
| import org.apache.datasketches.memory.WritableMemory; |
| |
| /** |
| * @author Lee Rhodes |
| */ |
| @SuppressWarnings("javadoc") |
| public class DirectUnionCaseTest { |
| long v = 0; |
| |
| @Test |
| public void checkCase0() { //src: LIST, gadget: LIST, cases 0, 0 |
| int n1 = 2; |
| int n2 = 3; |
| int n3 = 2; |
| int sum = n1 + n2 + n3; |
| Union u = buildUnion(12, n1); |
| HllSketch h2 = build(11, HLL_6, n2); |
| HllSketch h3 = build(10, HLL_8, n3); |
| u.update(h2); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), LIST); |
| u.update(h3); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), LIST); |
| assertEquals(u.getLgConfigK(), 12); |
| assertFalse(u.isOutOfOrderFlag()); |
| double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrderFlag(), 2.0); |
| println("ErrToll: " + err); |
| assertEquals(u.getEstimate(), sum, err); |
| } |
| |
| @Test |
| public void checkCase1() { //src: SET, gadget: LIST, cases 0, 1 |
| int n1 = 5; |
| int n2 = 2; |
| int n3 = 16; |
| int sum = n1 + n2 + n3; |
| Union u = buildUnion(12, n1); //LIST, 5 |
| HllSketch h2 = build(11, HLL_6, n2); //LIST, 2 |
| HllSketch h3 = build(10, HLL_8, n3); //SET |
| u.update(h2); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), LIST); |
| u.update(h3); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), SET); |
| assertEquals(u.getLgConfigK(), 12); |
| assertTrue(u.isOutOfOrderFlag()); |
| double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrderFlag(), 2.0); |
| println("ErrToll: " + err); |
| assertEquals(u.getEstimate(), sum, err); |
| |
| } |
| |
| @Test |
| public void checkCase2() { //src: HLL, gadget: LIST, swap, cases 0, 2 |
| int n1 = 5; |
| int n2 = 2; |
| int n3 = 97; |
| int sum = n1 + n2 + n3; |
| Union u = buildUnion(12, n1); |
| HllSketch h2 = build(11, HLL_8, n2); |
| HllSketch h3 = build(10, HLL_4, n3); |
| u.update(h2); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), LIST); |
| u.update(h3); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), HLL); |
| assertEquals(u.getLgConfigK(), 10); |
| assertFalse(u.isOutOfOrderFlag()); |
| double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrderFlag(), 2.0); |
| println("ErrToll: " + err); |
| assertEquals(u.getEstimate(), sum, err); |
| } |
| |
| @Test |
| public void checkCase2B() { //src: HLL, gadget: LIST, swap, cases 0, 2; different lgKs |
| int n1 = 5; |
| int n2 = 2; |
| int n3 = 769; |
| int sum = n1 + n2 + n3; |
| Union u = buildUnion(12, n1); |
| HllSketch h2 = build(11, HLL_8, n2); |
| HllSketch h3 = build(13, HLL_4, n3); |
| u.update(h2); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), LIST); |
| u.update(h3); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), HLL); |
| assertEquals(u.getLgConfigK(), 12); |
| assertFalse(u.isOutOfOrderFlag()); |
| double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrderFlag(), 2.0); |
| println("ErrToll: " + err); |
| assertEquals(u.getEstimate(), sum, err); |
| } |
| |
| @Test |
| public void checkCase4() { //src: LIST, gadget: SET, cases 0, 4 |
| int n1 = 6; |
| int n2 = 10; |
| int n3 = 6; |
| int sum = n1 + n2 + n3; |
| Union u = buildUnion(12, n1); |
| HllSketch h2 = build(11, HLL_6, n2); //SET |
| HllSketch h3 = build(10, HLL_8, n3); |
| u.update(h2); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), SET); |
| u.update(h3); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), SET); |
| assertEquals(u.getLgConfigK(), 12); |
| assertTrue(u.isOutOfOrderFlag()); |
| double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrderFlag(), 2.0); |
| println("ErrToll: " + err); |
| assertEquals(u.getEstimate(), sum, err); |
| } |
| |
| @Test |
| public void checkCase5() { //src: SET, gadget: SET, cases 0, 5 |
| int n1 = 6; |
| int n2 = 10; |
| int n3 = 16; |
| int sum = n1 + n2 + n3; |
| Union u = buildUnion(12, n1); |
| HllSketch h2 = build(11, HLL_6, n2); |
| HllSketch h3 = build(10, HLL_8, n3); |
| u.update(h2); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), SET); |
| u.update(h3); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), SET); |
| assertEquals(u.getLgConfigK(), 12); |
| assertTrue(u.isOutOfOrderFlag()); |
| double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrderFlag(), 2.0); |
| println("ErrToll: " + err); |
| assertEquals(u.getEstimate(), sum, err); |
| } |
| |
| @Test |
| public void checkCase6() { //src: HLL, gadget: SET, swap, cases 1, 6 |
| int n1 = 2; |
| int n2 = 192; |
| int n3 = 97; |
| int sum = n1 + n2 + n3; |
| Union u = buildUnion(12, n1); |
| HllSketch h2 = build(11, HLL_8, n2); |
| HllSketch h3 = build(10, HLL_4, n3); |
| u.update(h2); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), SET); |
| u.update(h3); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), HLL); |
| assertEquals(u.getLgConfigK(), 10); |
| assertTrue(u.isOutOfOrderFlag()); |
| double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrderFlag(), 2.0); |
| println("ErrToll: " + err); |
| assertEquals(u.getEstimate(), sum, err); |
| } |
| |
| @Test |
| public void checkCase6B() { //src: HLL, gadget: SET, swap, downsize, cases 1, 6 |
| int n1 = 6; |
| int n2 = 20; |
| int n3 = 769; |
| int sum = n1 + n2 + n3; |
| Union u = buildUnion(12, n1); |
| HllSketch h2 = build(11, HLL_8, n2); |
| HllSketch h3 = build(13, HLL_4, n3); |
| u.update(h2); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), SET); |
| u.update(h3); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), HLL); |
| assertEquals(u.getLgConfigK(), 12); |
| assertTrue(u.isOutOfOrderFlag()); |
| double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrderFlag(), 2.0); |
| println("ErrToll: " + err); |
| assertEquals(u.getEstimate(), sum, err); |
| } |
| |
| @Test |
| public void checkCase8() { //src: LIST, gadget: HLL, cases 2 (swap), 8 |
| int n1 = 6; |
| int n2 = 193; |
| int n3 = 7; |
| int sum = n1 + n2 + n3; |
| Union u = buildUnion(12, n1); //LIST |
| HllSketch h2 = build(11, HLL_6, n2); //HLL |
| HllSketch h3 = build(10, HLL_8, n3); //LIST |
| u.update(h2); //SET |
| println(u.toString()); |
| assertEquals(u.getCurMode(), HLL); |
| u.update(h3); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), HLL); |
| assertEquals(u.getLgConfigK(), 11); |
| assertFalse(u.isOutOfOrderFlag()); |
| double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrderFlag(), 2.0); |
| println("ErrToll: " + err); |
| assertEquals(u.getEstimate(), sum, err); |
| } |
| |
| @Test |
| public void checkCase9() { //src: SET, gadget: HLL, cases 2 (swap), 9 |
| int n1 = 6; |
| int n2 = 193; |
| int n3 = 16; |
| int sum = n1 + n2 + n3; |
| Union u = buildUnion(12, n1); //LIST |
| HllSketch h2 = build(11, HLL_6, n2); //HLL |
| HllSketch h3 = build(10, HLL_8, n3); |
| u.update(h2); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), HLL); |
| u.update(h3); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), HLL); |
| assertEquals(u.getLgConfigK(), 11); |
| assertTrue(u.isOutOfOrderFlag()); |
| double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrderFlag(), 2.0); |
| println("ErrToll: " + err); |
| assertEquals(u.getEstimate(), sum, err); |
| } |
| |
| @Test |
| public void checkCase10() { //src: HLL, gadget: HLL, cases 2 (swap), 10, downsample |
| int n1 = 6; |
| int n2 = 193; |
| int n3 = 97; |
| int sum = n1 + n2 + n3; |
| Union u = buildUnion(12, n1); //LIST |
| HllSketch h2 = build(11, HLL_6, n2); //HLL |
| HllSketch h3 = build(10, HLL_8, n3); |
| u.update(h2); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), HLL); |
| u.update(h3); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), HLL); |
| assertEquals(u.getLgConfigK(), 10); |
| assertTrue(u.isOutOfOrderFlag()); |
| double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrderFlag(), 2.0); |
| println("ErrToll: " + err); |
| assertEquals(u.getEstimate(), sum, err); |
| } |
| |
| @Test |
| public void checkCase10B() { //src: HLL, gadget: HLL, cases 2 (swap), 10, copy to HLL_8 |
| int n1 = 6; |
| int n2 = 193; |
| int n3 = 193; |
| int sum = n1 + n2 + n3; |
| Union u = buildUnion(12, n1); //LIST |
| HllSketch h2 = build(11, HLL_6, n2); //HLL_6 |
| HllSketch h3 = build(11, HLL_8, n3); |
| u.update(h2); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), HLL); |
| u.update(h3); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), HLL); |
| assertEquals(u.getLgConfigK(), 11); |
| assertTrue(u.isOutOfOrderFlag()); |
| double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrderFlag(), 2.0); |
| println("ErrToll: " + err); |
| assertEquals(u.getEstimate(), sum, err); |
| } |
| |
| @Test |
| public void checkCase12() { //src: LIST, gadget: empty, case 12 |
| int n1 = 0; |
| int n2 = 0; |
| int n3 = 7; |
| int sum = n1 + n2 + n3; |
| Union u = buildUnion(12, n1); //LIST empty |
| HllSketch h2 = build(11, HLL_6, n2); //LIST empty, ignored |
| HllSketch h3 = build(10, HLL_8, n3); //Src LIST |
| u.update(h2); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), LIST); |
| u.update(h3); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), LIST); |
| assertEquals(u.getLgConfigK(), 12); |
| assertFalse(u.isOutOfOrderFlag()); |
| double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrderFlag(), 2.0); |
| println("ErrToll: " + err); |
| assertEquals(u.getEstimate(), sum, err); |
| } |
| |
| @Test |
| public void checkCase13() { //src: SET, gadget: empty, case 13 |
| int n1 = 0; |
| int n2 = 0; |
| int n3 = 16; |
| int sum = n1 + n2 + n3; |
| Union u = buildUnion(12, n1); //LIST empty |
| HllSketch h2 = build(11, HLL_6, n2); //LIST empty, ignored |
| HllSketch h3 = build(10, HLL_8, n3); // Src Set |
| u.update(h2); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), LIST); |
| u.update(h3); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), SET); |
| assertEquals(u.getLgConfigK(), 12); |
| assertTrue(u.isOutOfOrderFlag()); |
| double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrderFlag(), 2.0); |
| println("ErrToll: " + err); |
| assertEquals(u.getEstimate(), sum, err); |
| } |
| |
| @Test |
| public void checkCase14() { //src: HLL, gadget: empty, case 14 |
| int n1 = 0; |
| int n2 = 0; |
| int n3 = 97; |
| int sum = n1 + n2 + n3; |
| Union u = buildUnion(12, n1); //LIST empty |
| HllSketch h2 = build(11, HLL_6, n2); //LIST empty |
| HllSketch h3 = build(10, HLL_8, n3); // Src HLL |
| u.update(h2); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), LIST); |
| u.update(h3); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), HLL); |
| assertEquals(u.getLgConfigK(), 10); |
| assertFalse(u.isOutOfOrderFlag()); |
| double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrderFlag(), 2.0); |
| println("ErrToll: " + err); |
| assertEquals(u.getEstimate(), sum, err); |
| } |
| |
| @Test |
| public void checkCase14B() { //src: HLL, gadget: empty, case 14, downsize |
| int n1 = 0; |
| int n2 = 0; |
| int n3 = 385; |
| int sum = n1 + n2 + n3; |
| Union u = buildUnion(12, n1); //LIST empty |
| HllSketch h2 = build(11, HLL_6, n2); //LIST empty |
| HllSketch h3 = build(12, HLL_8, n3); |
| u.update(h2); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), LIST); |
| u.update(h3); |
| println(u.toString()); |
| assertEquals(u.getCurMode(), HLL); |
| assertEquals(u.getLgConfigK(), 12); |
| assertFalse(u.isOutOfOrderFlag()); |
| double err = sum * errorFactor(u.getLgConfigK(), u.isOutOfOrderFlag(), 2.0); |
| println("ErrToll: " + err); |
| assertEquals(u.getEstimate(), sum, err); |
| } |
| |
| @Test |
| public void checkMisc() { |
| Union u = buildUnion(12, 0); |
| int bytes = u.getCompactSerializationBytes(); |
| assertEquals(bytes, 8); |
| bytes = Union.getMaxSerializationBytes(7); |
| assertEquals(bytes, 40 + 128); |
| double v = u.getEstimate(); |
| assertEquals(v, 0.0, 0.0); |
| v = u.getLowerBound(1); |
| assertEquals(v, 0.0, 0.0); |
| v = u.getUpperBound(1); |
| assertEquals(v, 0.0, 0.0); |
| assertTrue(u.isEmpty()); |
| u.reset(); |
| assertTrue(u.isEmpty()); |
| println(u.toString(true, false, false, false)); |
| byte[] bArr = u.toCompactByteArray(); |
| assertEquals(bArr.length, 8); |
| } |
| |
| private static double errorFactor(int lgK, boolean oooFlag, double numStdDev) { |
| double f; |
| if (oooFlag) { |
| f = (1.2 * numStdDev) / Math.sqrt(1 << lgK); |
| } else { |
| f = (0.9 * numStdDev) / Math.sqrt(1 << lgK); |
| } |
| return f; |
| } |
| |
| private Union buildUnion(int lgMaxK, int n) { |
| final int bytes = HllSketch.getMaxUpdatableSerializationBytes(lgMaxK, TgtHllType.HLL_8); |
| WritableMemory wmem = WritableMemory.allocate(bytes); |
| Union u = new Union(lgMaxK, wmem); |
| for (int i = 0; i < n; i++) { u.update(i + v); } |
| v += n; |
| return u; |
| } |
| |
| private HllSketch build(int lgK, TgtHllType tgtHllType, int n) { |
| final int bytes = HllSketch.getMaxUpdatableSerializationBytes(lgK, tgtHllType); |
| WritableMemory wmem = WritableMemory.allocate(bytes); |
| HllSketch sk = new HllSketch(lgK, tgtHllType, wmem); |
| for (int i = 0; i < n; i++) { sk.update(i + v); } |
| v += n; |
| return sk; |
| } |
| |
| @Test |
| public void printlnTest() { |
| println("PRINTING: "+this.getClass().getName()); |
| } |
| |
| /** |
| * @param s value to print |
| */ |
| static void println(String s) { |
| //System.out.println(s); //disable here |
| } |
| |
| |
| } |