// blob: 8e8b873c1e2ec49def645529d866b2599eb1c15e
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
#include "hll.hpp"
#include "CouponHashSet.hpp"
#include "HllUtil.hpp"
#include <catch.hpp>
#include <cmath>
#include <cstddef>
#include <cstdint>
#include <exception>
#include <ostream>
#include <sstream>
#include <stdexcept>
#include <string>
namespace datasketches {
// Checks how deserialization from a byte array reacts to a corrupted or
// truncated image of a sketch serialized with serialize_updatable().
//
// Each step overwrites exactly one preamble byte, checks the outcome, and then
// restores that byte, so every check sees a single corruption at a time.
TEST_CASE("coupon hash set: check corrupt bytearray", "[coupon_hash_set]") {
  int lgK = 8;
  hll_sketch sk1(lgK);
  // 24 distinct values; the test name and the HASH_SET_PREINTS restore below
  // indicate the sketch is expected to be in hash-set mode at this point.
  for (int i = 0; i < 24; ++i) {
    sk1.update(i);
  }
  auto sketchBytes = sk1.serialize_updatable();
  uint8_t* bytes = sketchBytes.data();
  const size_t size = sketchBytes.size();

  // Corrupt the preamble-ints byte.
  bytes[HllUtil<>::PREAMBLE_INTS_BYTE] = 0;
  // fail in HllSketchImpl
  REQUIRE_THROWS_AS(hll_sketch::deserialize(bytes, size), std::invalid_argument);
  // fail in CouponHashSet
  REQUIRE_THROWS_AS(CouponHashSet<>::newSet(bytes, size), std::invalid_argument);
  bytes[HllUtil<>::PREAMBLE_INTS_BYTE] = HllUtil<>::HASH_SET_PREINTS;

  // Corrupt the serialization-version byte.
  bytes[HllUtil<>::SER_VER_BYTE] = 0;
  REQUIRE_THROWS_AS(hll_sketch::deserialize(bytes, size), std::invalid_argument);
  bytes[HllUtil<>::SER_VER_BYTE] = HllUtil<>::SER_VER;

  // Corrupt the family-id byte.
  bytes[HllUtil<>::FAMILY_BYTE] = 0;
  REQUIRE_THROWS_AS(hll_sketch::deserialize(bytes, size), std::invalid_argument);
  bytes[HllUtil<>::FAMILY_BYTE] = HllUtil<>::FAMILY_ID;

  // Replace lgK with a value the deserializer is expected to reject here.
  bytes[HllUtil<>::LG_K_BYTE] = 6;
  REQUIRE_THROWS_AS(hll_sketch::deserialize(bytes, size), std::invalid_argument);
  bytes[HllUtil<>::LG_K_BYTE] = static_cast<uint8_t>(lgK);

  // Replace the mode byte with one that does not match the stored data.
  uint8_t tmp = bytes[HllUtil<>::MODE_BYTE];
  bytes[HllUtil<>::MODE_BYTE] = 0x10; // HLL_6, LIST
  REQUIRE_THROWS_AS(hll_sketch::deserialize(bytes, size), std::invalid_argument);
  bytes[HllUtil<>::MODE_BYTE] = tmp;

  // Zero the lg-array-size byte: should work fine despite the corruption.
  tmp = bytes[HllUtil<>::LG_ARR_BYTE];
  bytes[HllUtil<>::LG_ARR_BYTE] = 0;
  REQUIRE_NOTHROW(hll_sketch::deserialize(bytes, size));
  bytes[HllUtil<>::LG_ARR_BYTE] = tmp;

  // Truncated input must be reported as out_of_range.
  REQUIRE_THROWS_AS(hll_sketch::deserialize(bytes, size - 1), std::out_of_range);
  REQUIRE_THROWS_AS(hll_sketch::deserialize(bytes, 3), std::out_of_range);
}
// Checks how deserialization from a stream reacts to a corrupted image of a
// sketch serialized with serialize_compact().
//
// Each step overwrites exactly one preamble byte via the put pointer, rewinds
// the get pointer to the start, checks the outcome, and then restores the
// byte, so every check sees a single corruption at a time.
TEST_CASE("coupon hash set: check corrupt stream", "[coupon_hash_set]") {
  int lgK = 9;
  hll_sketch sk1(lgK);
  // 24 distinct values; the test name and the HASH_SET_PREINTS restore below
  // indicate the sketch is expected to be in hash-set mode at this point.
  for (int i = 0; i < 24; ++i) {
    sk1.update(i);
  }
  std::stringstream ss;
  sk1.serialize_compact(ss);

  // Corrupt the preamble-ints byte.
  ss.seekp(HllUtil<>::PREAMBLE_INTS_BYTE);
  ss.put(0);
  ss.seekg(0);
  // fail in HllSketchImpl
  REQUIRE_THROWS_AS(hll_sketch::deserialize(ss), std::invalid_argument);
  // fail in CouponHashSet
  // Rewind first so this check reads the corrupted preamble from the start of
  // the image, independent of how much the failed call above consumed.
  ss.seekg(0);
  REQUIRE_THROWS_AS(CouponHashSet<>::newSet(ss), std::invalid_argument);
  ss.seekp(HllUtil<>::PREAMBLE_INTS_BYTE);
  ss.put(HllUtil<>::HASH_SET_PREINTS);

  // Corrupt the serialization-version byte.
  ss.seekp(HllUtil<>::SER_VER_BYTE);
  ss.put(0);
  ss.seekg(0);
  REQUIRE_THROWS_AS(hll_sketch::deserialize(ss), std::invalid_argument);
  ss.seekp(HllUtil<>::SER_VER_BYTE);
  ss.put(HllUtil<>::SER_VER);

  // Corrupt the family-id byte.
  ss.seekp(HllUtil<>::FAMILY_BYTE);
  ss.put(0);
  ss.seekg(0);
  REQUIRE_THROWS_AS(hll_sketch::deserialize(ss), std::invalid_argument);
  ss.seekp(HllUtil<>::FAMILY_BYTE);
  ss.put(HllUtil<>::FAMILY_ID);

  // Replace the mode byte with one that does not match the stored data.
  ss.seekg(HllUtil<>::MODE_BYTE);
  uint8_t tmp = static_cast<uint8_t>(ss.get());
  ss.seekp(HllUtil<>::MODE_BYTE);
  ss.put(0x22); // HLL_8, HLL
  ss.seekg(0);
  REQUIRE_THROWS_AS(hll_sketch::deserialize(ss), std::invalid_argument);
  ss.seekp(HllUtil<>::MODE_BYTE);
  ss.put(static_cast<char>(tmp));

  // Zero the lg-array-size byte: should work fine despite the corruption.
  ss.seekg(HllUtil<>::LG_ARR_BYTE);
  tmp = static_cast<uint8_t>(ss.get());
  ss.seekp(HllUtil<>::LG_ARR_BYTE);
  ss.put(0);
  ss.seekg(0);
  REQUIRE_NOTHROW(hll_sketch::deserialize(ss));
  // Restore the original byte so the image is left intact.
  ss.seekp(HllUtil<>::LG_ARR_BYTE);
  ss.put(static_cast<char>(tmp));
}
} // namespace datasketches