blob: f177fb31a89b32947dcd367483797b962b9fea35 [file] [log] [blame]
/*
* Copyright 2018, Oath Inc.
* Licensed under the terms of the Apache License 2.0. See LICENSE file at the project root for terms.
*/
package com.yahoo.sketches.hive.kll;
import org.apache.hadoop.hive.ql.exec.Description;
import org.apache.hadoop.hive.ql.exec.UDFArgumentException;
import org.apache.hadoop.hive.ql.metadata.HiveException;
import org.apache.hadoop.hive.ql.parse.SemanticException;
import org.apache.hadoop.hive.ql.udf.generic.AbstractGenericUDAFResolver;
import org.apache.hadoop.hive.ql.udf.generic.GenericUDAFEvaluator;
import org.apache.hadoop.hive.ql.udf.generic.GenericUDAFParameterInfo;
import org.apache.hadoop.hive.serde2.objectinspector.ObjectInspector;
import org.apache.hadoop.hive.serde2.objectinspector.PrimitiveObjectInspector.PrimitiveCategory;
import org.apache.hadoop.hive.serde2.objectinspector.primitive.PrimitiveObjectInspectorUtils;
/**
 * Hive UDAF resolver for the "DataToSketch" function described in the
 * {@link Description} annotation below.
 *
 * <p>The resolver checks the number and primitive categories of the call's arguments
 * and hands aggregation off to {@link DataToSketchEvaluator}.
 */
@Description(name = "DataToSketch", value = "_FUNC_(value, k) - "
    + "Returns a KllFloatsSketch in a serialized form as a binary blob."
    + " Values must be of type float."
    + " Parameter k controls the accuracy and the size of the sketch."
    + " If k is omitted, the default is used.")
@SuppressWarnings("javadoc")
public class DataToSketchUDAF extends AbstractGenericUDAFResolver {

  /**
   * Validates the call signature and returns the evaluator that performs the aggregation.
   *
   * <p>Accepted signatures are {@code (value)} and {@code (value, k)}. The first argument
   * is checked against {@link PrimitiveCategory#FLOAT}; the second, when present, against
   * {@link PrimitiveCategory#INT}.
   *
   * @param info parameter information for the function call; only its object inspectors
   *     are consulted here
   * @return a new {@link DataToSketchEvaluator}
   * @throws SemanticException if the number of arguments is neither one nor two (reported
   *     as a {@link UDFArgumentException}), or if {@code ObjectInspectorValidator} rejects
   *     an argument
   */
  @Override
  public GenericUDAFEvaluator getEvaluator(final GenericUDAFParameterInfo info)
      throws SemanticException {
    final ObjectInspector[] inspectors = info.getParameterObjectInspectors();
    if ((inspectors.length != 1) && (inspectors.length != 2)) {
      throw new UDFArgumentException("One or two arguments expected");
    }
    // Argument 0: the value to be fed into the sketch.
    ObjectInspectorValidator.validateGivenPrimitiveCategory(inspectors[0], 0,
        PrimitiveCategory.FLOAT);
    // Argument 1 (optional): the sketch parameter k.
    if (inspectors.length == 2) {
      ObjectInspectorValidator.validateGivenPrimitiveCategory(inspectors[1], 1,
          PrimitiveCategory.INT);
    }
    return new DataToSketchEvaluator();
  }

  /**
   * Evaluator that feeds raw float values into the sketch held by the aggregation buffer.
   *
   * <p>Only {@code iterate} is defined here; everything else comes from
   * {@code SketchEvaluator}. NOTE(review): {@code kInspector_} and {@code inputInspector_}
   * are not declared in this class - presumably they are set up by {@code SketchEvaluator};
   * confirm there.
   */
  static class DataToSketchEvaluator extends SketchEvaluator {

    /**
     * Adds one input row to the sketch state stored in {@code buf}.
     *
     * <p>Rows whose value ({@code data[0]}) is {@code null} are skipped without touching
     * the buffer. If the state has not been initialized yet, it is initialized first:
     * with k read from {@code data[1]} when {@code kInspector_} is non-null, otherwise
     * through the no-argument {@code init()}.
     *
     * @param buf aggregation buffer; cast to {@code SketchState}
     * @param data the row's arguments: {@code data[0]} is the value, {@code data[1]} is k
     *     (read only when {@code kInspector_} is non-null)
     * @throws HiveException declared by the overridden method
     */
    // NOTE(review): "deprecation" is presumably suppressed for AggregationBuffer - confirm.
    @SuppressWarnings("deprecation")
    @Override
    public void iterate(final AggregationBuffer buf, final Object[] data) throws HiveException {
      if (data[0] == null) { return; }
      final SketchState state = (SketchState) buf;
      // Lazy initialization: k is only consulted on the first non-null value seen.
      if (!state.isInitialized()) {
        if (kInspector_ != null) {
          state.init(PrimitiveObjectInspectorUtils.getInt(data[1], kInspector_));
        } else {
          state.init();
        }
      }
      final float value = (float) inputInspector_.getPrimitiveJavaObject(data[0]);
      state.update(value);
    }

  }

}