// blob: de92ba312a50db3ad0b0cbc5d34d9d2fe538995a [file] [log] [blame]
/*
* Copyright 2019, Verizon Media.
* Licensed under the terms of the Apache License 2.0. See LICENSE file at the project root for terms.
*/
package com.yahoo.sketches.pig.cpc;
import org.apache.pig.EvalFunc;
import org.apache.pig.data.DataByteArray;
import org.apache.pig.data.DataType;
import org.apache.pig.data.Tuple;
import org.apache.pig.data.TupleFactory;
import org.apache.pig.impl.logicalLayer.schema.Schema;
import org.testng.Assert;
import org.testng.annotations.Test;
import com.yahoo.sketches.cpc.CpcSketch;
/**
 * Unit tests for the {@link GetEstimateAndErrorBounds} Pig UDF.
 *
 * <p>Covered scenarios: a null input tuple, an empty input tuple, a serialized sketch holding two
 * distinct values (UDF built with no arguments, with one string argument, and with two string
 * arguments), and the output schema reported by the UDF.</p>
 */
public class GetEstimateAndErrorBoundsTest {
  private static final TupleFactory TUPLE_FACTORY = TupleFactory.getInstance();

  /** Number of distinct values placed into each sketch by {@link #twoValueSketchTuple(CpcSketch)}. */
  private static final double EXPECTED_ESTIMATE = 2.0;

  /** Absolute tolerance used when comparing the returned estimate with the expected one. */
  private static final double ESTIMATE_TOLERANCE = 0.01;

  /** Number of fields expected in the result tuple; agrees with the inner schema checked in {@link #schema()}. */
  private static final int RESULT_FIELDS = 3;

  /**
   * Feeds the values 1 and 2 into the given sketch and wraps its serialized bytes in a
   * single-field tuple suitable as UDF input.
   *
   * @param sketch the sketch to populate; it is updated in place
   * @return a tuple whose only field is a {@link DataByteArray} holding the serialized sketch
   */
  private static Tuple twoValueSketchTuple(final CpcSketch sketch) {
    sketch.update(1);
    sketch.update(2);
    return TUPLE_FACTORY.newTuple(new DataByteArray(sketch.toByteArray()));
  }

  /**
   * Checks a UDF result produced from a two-value sketch: the tuple must be non-null, have
   * {@link #RESULT_FIELDS} fields, carry an estimate close to {@link #EXPECTED_ESTIMATE} in
   * field 0, a value not above it in field 1, and a value not below it in field 2.
   *
   * @param result the tuple returned by the UDF
   * @throws Exception if a field cannot be read from the tuple
   */
  private static void assertEstimateAndBounds(final Tuple result) throws Exception {
    Assert.assertNotNull(result);
    // Guards against missing or extra fields, which the per-field checks below would not notice.
    Assert.assertEquals(result.size(), RESULT_FIELDS);
    Assert.assertEquals((Double) result.get(0), EXPECTED_ESTIMATE, ESTIMATE_TOLERANCE);
    Assert.assertTrue((Double) result.get(1) <= EXPECTED_ESTIMATE);
    Assert.assertTrue((Double) result.get(2) >= EXPECTED_ESTIMATE);
  }

  /** A null input tuple must yield a null result. */
  @Test
  public void nullInputTuple() throws Exception {
    final EvalFunc<Tuple> func = new GetEstimateAndErrorBounds();
    Assert.assertNull(func.exec(null));
  }

  /** An input tuple with no fields must yield a null result. */
  @Test
  public void emptyInputTuple() throws Exception {
    final EvalFunc<Tuple> func = new GetEstimateAndErrorBounds();
    Assert.assertNull(func.exec(TUPLE_FACTORY.newTuple()));
  }

  /** UDF constructed without arguments, applied to a default-constructed sketch. */
  @Test
  public void normalCase() throws Exception {
    final EvalFunc<Tuple> func = new GetEstimateAndErrorBounds();
    final Tuple input = twoValueSketchTuple(new CpcSketch());
    assertEstimateAndBounds(func.exec(input));
  }

  /** UDF constructed with a single string argument ("1"), applied to a default-constructed sketch. */
  @Test
  public void normalCaseWithKappa() throws Exception {
    final EvalFunc<Tuple> func = new GetEstimateAndErrorBounds("1");
    final Tuple input = twoValueSketchTuple(new CpcSketch());
    assertEstimateAndBounds(func.exec(input));
  }

  /**
   * UDF constructed with two string arguments ("3", "123"), applied to a sketch built with
   * {@code new CpcSketch(12, 123)}; the sketch's second argument mirrors the UDF's second one.
   */
  @Test
  public void normalCaseWithKappaAndSeed() throws Exception {
    final EvalFunc<Tuple> func = new GetEstimateAndErrorBounds("3", "123");
    final Tuple input = twoValueSketchTuple(new CpcSketch(12, 123));
    assertEstimateAndBounds(func.exec(input));
  }

  /**
   * The output schema for a bytearray input must consist of one tuple field whose inner schema
   * has three fields of type double.
   */
  @Test
  public void schema() throws Exception {
    final EvalFunc<Tuple> func = new GetEstimateAndErrorBounds();
    final Schema inputSchema = new Schema(new Schema.FieldSchema("Sketch", DataType.BYTEARRAY));
    final Schema outputSchema = func.outputSchema(inputSchema);
    Assert.assertNotNull(outputSchema);
    Assert.assertEquals(outputSchema.size(), 1);
    Assert.assertEquals(DataType.findTypeName(outputSchema.getField(0).type), "tuple");

    final Schema innerSchema = outputSchema.getField(0).schema;
    Assert.assertEquals(innerSchema.size(), 3);
    for (int i = 0; i < 3; i++) {
      Assert.assertEquals(DataType.findTypeName(innerSchema.getField(i).type), "double");
    }
  }
}