blob: 5eb4552477371326b336a40efb002f733de90ec1 [file] [log] [blame]
* Druid - a distributed column store.
* Copyright (C) 2012, 2013 Metamarkets Group Inc.
* This program is free software; you can redistribute it and/or
* modify it under the terms of the GNU General Public License
* as published by the Free Software Foundation; either version 2
* of the License, or (at your option) any later version.
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
package io.druid.query.aggregation.hyperloglog;
import com.fasterxml.jackson.annotation.JsonCreator;
import com.fasterxml.jackson.annotation.JsonProperty;
import com.metamx.common.IAE;
import io.druid.query.aggregation.Aggregator;
import io.druid.query.aggregation.AggregatorFactory;
import io.druid.query.aggregation.BufferAggregator;
import io.druid.query.aggregation.NoopAggregator;
import io.druid.query.aggregation.NoopBufferAggregator;
import io.druid.segment.ColumnSelectorFactory;
import io.druid.segment.ObjectColumnSelector;
import org.apache.commons.codec.binary.Base64;
import java.nio.ByteBuffer;
import java.nio.charset.StandardCharsets;
import java.util.Arrays;
import java.util.Comparator;
import java.util.List;
public class HyperUniquesAggregatorFactory implements AggregatorFactory
public static Object estimateCardinality(Object object)
if (object == null) {
return 0;
return ((HyperLogLogCollector) object).estimateCardinality();
private static final byte CACHE_TYPE_ID = 0x5;
private final String name;
private final String fieldName;
public HyperUniquesAggregatorFactory(
@JsonProperty("name") String name,
@JsonProperty("fieldName") String fieldName
{ = name;
this.fieldName = fieldName.toLowerCase();
public Aggregator factorize(ColumnSelectorFactory metricFactory)
ObjectColumnSelector selector = metricFactory.makeObjectColumnSelector(fieldName);
if (selector == null) {
return new NoopAggregator(name);
if (HyperLogLogCollector.class.isAssignableFrom(selector.classOfObject())) {
return new HyperUniquesAggregator(name, selector);
throw new IAE(
"Incompatible type for metric[%s], expected a HyperUnique, got a %s", fieldName, selector.classOfObject()
public BufferAggregator factorizeBuffered(ColumnSelectorFactory metricFactory)
ObjectColumnSelector selector = metricFactory.makeObjectColumnSelector(fieldName);
if (selector == null) {
return new NoopBufferAggregator();
if (HyperLogLogCollector.class.isAssignableFrom(selector.classOfObject())) {
return new HyperUniquesBufferAggregator(selector);
throw new IAE(
"Incompatible type for metric[%s], expected a HyperUnique, got a %s", fieldName, selector.classOfObject()
public Comparator getComparator()
return new Comparator<HyperLogLogCollector>()
public int compare(HyperLogLogCollector lhs, HyperLogLogCollector rhs)
return lhs.compareTo(rhs);
public Object combine(Object lhs, Object rhs)
if (rhs == null) {
return lhs;
if (lhs == null) {
return rhs;
return ((HyperLogLogCollector) lhs).fold((HyperLogLogCollector) rhs);
public AggregatorFactory getCombiningFactory()
return new HyperUniquesAggregatorFactory(name, name);
public Object deserialize(Object object)
if (object instanceof byte[]) {
return HyperLogLogCollector.makeCollector(ByteBuffer.wrap((byte[]) object));
} else if (object instanceof ByteBuffer) {
return HyperLogLogCollector.makeCollector((ByteBuffer) object);
} else if (object instanceof String) {
return HyperLogLogCollector.makeCollector(
ByteBuffer.wrap(Base64.decodeBase64(((String) object).getBytes(Charsets.UTF_8)))
return object;
public Object finalizeComputation(Object object)
return estimateCardinality(object);
public String getName()
return name;
public List<String> requiredFields()
return Arrays.asList(fieldName);
public String getFieldName()
return fieldName;
public byte[] getCacheKey()
byte[] fieldNameBytes = fieldName.getBytes(Charsets.UTF_8);
return ByteBuffer.allocate(1 + fieldNameBytes.length).put(CACHE_TYPE_ID).put(fieldNameBytes).array();
public String getTypeName()
return "hyperUnique";
public int getMaxIntermediateSize()
return HyperLogLogCollector.getLatestNumBytesForDenseStorage();
public Object getAggregatorStartValue()
return HyperLogLogCollector.makeLatestCollector();
public String toString()
return "HyperUniquesAggregatorFactory{" +
"name='" + name + '\'' +
", fieldName='" + fieldName + '\'' +
public boolean equals(Object o)
if (this == o) return true;
if (o == null || getClass() != o.getClass()) return false;
HyperUniquesAggregatorFactory that = (HyperUniquesAggregatorFactory) o;
if (!fieldName.equals(that.fieldName)) return false;
if (!name.equals( return false;
return true;
public int hashCode()
int result = name.hashCode();
result = 31 * result + fieldName.hashCode();
return result;