blob: e3c752a4377ce879ee3989ff6f6f8cb0c37b7282 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
#include "hll.hpp"
#include <pybind11/pybind11.h>
namespace py = pybind11;
namespace datasketches {
namespace python {
hll_sketch hll_sketch_deserialize(py::bytes skBytes) {
std::string skStr = skBytes; // implicit cast
return hll_sketch::deserialize(skStr.c_str(), skStr.length());
}
py::object hll_sketch_serialize_compact(const hll_sketch& sk) {
auto serResult = sk.serialize_compact();
return py::bytes((char*)serResult.data(), serResult.size());
}
py::object hll_sketch_serialize_updatable(const hll_sketch& sk) {
auto serResult = sk.serialize_updatable();
return py::bytes((char*)serResult.data(), serResult.size());
}
}
}
namespace dspy = datasketches::python;
void init_hll(py::module &m) {
using namespace datasketches;
py::enum_<target_hll_type>(m, "tgt_hll_type", "Target HLL flavor")
.value("HLL_4", HLL_4)
.value("HLL_6", HLL_6)
.value("HLL_8", HLL_8)
.export_values();
py::class_<hll_sketch>(m, "hll_sketch")
.def(py::init<int>(), py::arg("lg_k"))
.def(py::init<int, target_hll_type>(), py::arg("lg_k"), py::arg("tgt_type"))
.def(py::init<int, target_hll_type, bool>(), py::arg("lg_k"), py::arg("tgt_type"), py::arg("start_max_size")=false)
.def_static("deserialize", &dspy::hll_sketch_deserialize)
.def("serialize_compact", &dspy::hll_sketch_serialize_compact)
.def("serialize_updatable", &dspy::hll_sketch_serialize_updatable)
.def("__str__", (std::string (hll_sketch::*)(bool,bool,bool,bool) const) &hll_sketch::to_string,
py::arg("summary")=true, py::arg("detail")=false, py::arg("aux_detail")=false, py::arg("all")=false)
.def("to_string", (std::string (hll_sketch::*)(bool,bool,bool,bool) const) &hll_sketch::to_string,
py::arg("summary")=true, py::arg("detail")=false, py::arg("aux_detail")=false, py::arg("all")=false)
.def_property_readonly("lg_config_k", &hll_sketch::get_lg_config_k)
.def_property_readonly("tgt_type", &hll_sketch::get_target_type)
.def("get_estimate", &hll_sketch::get_estimate)
.def("get_lower_bound", &hll_sketch::get_lower_bound, py::arg("num_std_devs"))
.def("get_upper_bound", &hll_sketch::get_upper_bound, py::arg("num_std_devs"))
.def("is_compact", &hll_sketch::is_compact)
.def("is_empty", &hll_sketch::is_empty)
.def("get_updatable_serialization_bytes", &hll_sketch::get_updatable_serialization_bytes)
.def("get_compact_serialization_bytes", &hll_sketch::get_compact_serialization_bytes)
.def("reset", &hll_sketch::reset)
.def("update", (void (hll_sketch::*)(int64_t)) &hll_sketch::update, py::arg("datum"))
.def("update", (void (hll_sketch::*)(double)) &hll_sketch::update, py::arg("datum"))
.def("update", (void (hll_sketch::*)(const std::string&)) &hll_sketch::update, py::arg("datum"))
.def_static("get_max_updatable_serialization_bytes", &hll_sketch::get_max_updatable_serialization_bytes,
py::arg("lg_k"), py::arg("tgt_type"))
.def_static("get_rel_err", &hll_sketch::get_rel_err,
py::arg("upper_bound"), py::arg("unioned"), py::arg("lg_k"), py::arg("num_std_devs"))
;
py::class_<hll_union>(m, "hll_union")
.def(py::init<int>(), py::arg("lg_max_k"))
.def_property_readonly("lg_config_k", &hll_union::get_lg_config_k)
.def_property_readonly("tgt_type", &hll_union::get_target_type)
.def("get_estimate", &hll_union::get_estimate)
.def("get_lower_bound", &hll_union::get_lower_bound, py::arg("num_std_devs"))
.def("get_upper_bound", &hll_union::get_upper_bound, py::arg("num_std_devs"))
.def("is_compact", &hll_union::is_compact)
.def("is_empty", &hll_union::is_empty)
.def("get_updatable_serialization_bytes", &hll_union::get_updatable_serialization_bytes)
.def("get_compact_serialization_bytes", &hll_union::get_compact_serialization_bytes)
.def("reset", &hll_union::reset)
.def("get_result", &hll_union::get_result, py::arg("tgt_type")=HLL_4)
.def<void (hll_union::*)(const hll_sketch&)>("update", &hll_union::update, py::arg("sketch"))
.def<void (hll_union::*)(int64_t)>("update", &hll_union::update, py::arg("datum"))
.def<void (hll_union::*)(double)>("update", &hll_union::update, py::arg("datum"))
.def<void (hll_union::*)(const std::string&)>("update", &hll_union::update, py::arg("datum"))
.def_static("get_max_serialization_bytes", &hll_union::get_max_serialization_bytes, py::arg("lg_k"))
.def_static("get_rel_err", &hll_union::get_rel_err,
py::arg("upper_bound"), py::arg("unioned"), py::arg("lg_k"), py::arg("num_std_devs"))
;
}