blob: 73aefdb3ea2fd22d61955457922693981f8576ff [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.apache.datasketches.kll;
import static org.apache.datasketches.kll.KllPreambleUtil.DATA_START_ADR;
import static org.apache.datasketches.kll.KllPreambleUtil.DATA_START_ADR_SINGLE_ITEM;
import static org.apache.datasketches.kll.KllSketch.Error.NOT_SINGLE_ITEM;
import static org.apache.datasketches.kll.KllSketch.Error.kllSketchThrow;
import static org.apache.datasketches.kll.KllSketch.SketchType.FLOATS_SKETCH;
import java.util.Objects;
import org.apache.datasketches.memory.Memory;
/**
* This class implements an on-heap floats KllSketch.
*
* <p>Please refer to the documentation in the package-info:<br>
* {@link org.apache.datasketches.kll}</p>
*
* @author Lee Rhodes, Kevin Lang
*/
final class KllHeapFloatsSketch extends KllFloatsSketch {
private final int k_; // configured size of K.
private final int m_; // configured size of M.
private long n_; // number of items input into this sketch.
private int minK_; // dynamic minK for error estimation after merging with different k.
private boolean isLevelZeroSorted_;
private float minFloatItem_;
private float maxFloatItem_;
private float[] floatItems_;
/**
* New instance heap constructor with a given parameters <em>k</em> and <em>m</em>.
*
* @param k parameter that controls size of the sketch and accuracy of estimates.
* <em>k</em> can be between <em>m</em> and 65535, inclusive.
* The default <em>k</em> = 200 results in a normalized rank error of about 1.65%.
* Larger <em>k</em> will have smaller error but the sketch will be larger (and slower).
* @param m parameter controls the minimum level width in items. It can be 2, 4, 6 or 8.
* The DEFAULT_M, which is 8 is recommended. Other sizes of <em>m</em> should be considered
* experimental as they have not been as well characterized.
*/
KllHeapFloatsSketch(final int k, final int m) {
super(null, null);
KllHelper.checkM(m);
KllHelper.checkK(k, m);
this.k_ = k;
this.m_ = m;
n_ = 0;
minK_ = k;
isLevelZeroSorted_ = false;
levelsArr = new int[] {k, k};
minFloatItem_ = Float.NaN;
maxFloatItem_ = Float.NaN;
floatItems_ = new float[k];
}
/**
* Heapify constructor.
* @param srcMem Memory object that contains data serialized by this sketch.
* @param memValidate the MemoryValidate object
*/
private KllHeapFloatsSketch(final Memory srcMem, final KllMemoryValidate memValidate) {
super(null, null);
k_ = memValidate.k;
m_ = memValidate.m;
n_ = memValidate.n;
minK_ = memValidate.minK;
levelsArr = memValidate.levelsArr;
isLevelZeroSorted_ = memValidate.level0Sorted;
final boolean updatableMemFormat = memValidate.updatableMemFormat;
if (memValidate.empty && !updatableMemFormat) {
minFloatItem_ = Float.NaN;
maxFloatItem_ = Float.NaN;
floatItems_ = new float[k_];
}
else if (memValidate.singleItem && !updatableMemFormat) {
final float item = srcMem.getFloat(DATA_START_ADR_SINGLE_ITEM);
minFloatItem_ = maxFloatItem_ = item;
floatItems_ = new float[k_];
floatItems_[k_ - 1] = item;
}
else { //Full or updatableMemFormat
int offsetBytes = DATA_START_ADR;
offsetBytes += (updatableMemFormat ? levelsArr.length * Integer.BYTES : (levelsArr.length - 1) * Integer.BYTES);
minFloatItem_ = srcMem.getFloat(offsetBytes);
offsetBytes += Float.BYTES;
maxFloatItem_ = srcMem.getFloat(offsetBytes);
offsetBytes += Float.BYTES;
final int capacityItems = levelsArr[getNumLevels()];
final int retainedItems = capacityItems - levelsArr[0];
floatItems_ = new float[capacityItems];
final int shift = levelsArr[0];
if (updatableMemFormat) {
offsetBytes += shift * Float.BYTES;
srcMem.getFloatArray(offsetBytes, floatItems_, shift, retainedItems);
} else {
srcMem.getFloatArray(offsetBytes, floatItems_, shift, retainedItems);
}
}
}
static KllHeapFloatsSketch heapifyImpl(final Memory srcMem) {
Objects.requireNonNull(srcMem, "Parameter 'srcMem' must not be null");
final KllMemoryValidate memVal = new KllMemoryValidate(srcMem, FLOATS_SKETCH);
return new KllHeapFloatsSketch(srcMem, memVal);
}
@Override
public int getK() { return k_; }
@Override
public long getN() { return n_; }
@Override
float[] getFloatItemsArray() { return floatItems_; }
@Override
float getFloatSingleItem() {
if (n_ != 1L) { kllSketchThrow(NOT_SINGLE_ITEM); return Float.NaN; }
return floatItems_[k_ - 1];
}
@Override
int getM() { return m_; }
@Override
float getMaxFloatItem() { return maxFloatItem_; }
@Override
float getMinFloatItem() { return minFloatItem_; }
@Override
int getMinK() { return minK_; }
@Override
void incN() { n_++; }
@Override
void incNumLevels() { } //not used here
@Override
boolean isLevelZeroSorted() { return isLevelZeroSorted_; }
@Override
void setFloatItemsArray(final float[] floatItems) { floatItems_ = floatItems; }
@Override
void setFloatItemsArrayAt(final int index, final float item) { floatItems_[index] = item; }
@Override
void setLevelZeroSorted(final boolean sorted) { this.isLevelZeroSorted_ = sorted; }
@Override
void setMaxFloatItem(final float item) { maxFloatItem_ = item; }
@Override
void setMinFloatItem(final float item) { minFloatItem_ = item; }
@Override
void setMinK(final int minK) { minK_ = minK; }
@Override
void setN(final long n) { n_ = n; }
@Override
void setNumLevels(final int numLevels) { } //not used here
}