// blob: 878033e41957eb9aeab14743041b8fe74d41d89e [file] [log] [blame]
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
#include <fmt/core.h>
#include <gtest/gtest.h>
#include <string>
#include "function_test_util.h"
#include "vec/columns/column_array.h"
#include "vec/core/types.h"
#include "vec/data_types/data_type_map.h"
namespace doris::vectorized {
// Checks that the `deduplicate_map` function collapses repeated keys inside
// every row of a Map<String, Int32> column.
//
// Fixture layout:
//   * `count` key/value entries are generated; the key of entry `i` is
//     "key_<i % distinct_keys>" and the value is `i % distinct_keys`.
//   * The entries are split evenly into `rows` map rows, so each row holds
//     `count / rows` consecutive entries and therefore sees every distinct key
//     several times.
//
// Expectation: after the function runs, each result row contains exactly
// `distinct_keys` entries. Only the per-row entry count is verified here, not
// which of the duplicated values is kept.
TEST(FunctionMapTest, deduplicate_map) {
    const std::string func_name = "deduplicate_map";

    auto type_map = std::make_shared<DataTypeMap>(std::make_shared<DataTypeString>(),
                                                  std::make_shared<DataTypeInt32>());
    auto argument_template = ColumnsWithTypeAndName {{nullptr, type_map, "map"}};
    auto function = SimpleFunctionFactory::instance().get_function(
            func_name, argument_template, type_map, {true},
            BeExecVersionManager::get_newest_version());
    ASSERT_TRUE(function != nullptr);

    // Single source of truth for the fixture shape; the generator and the
    // expectation below both derive from these values.
    const size_t count = 1024;
    const size_t rows = 32;
    const size_t distinct_keys = 8;
    const size_t entries_per_row = count / rows;
    static_assert(count % rows == 0, "entries must split evenly across rows");
    static_assert(entries_per_row >= distinct_keys,
                  "every row must be long enough to contain each distinct key");

    Block block;
    auto key_column = ColumnString::create();
    auto value_column = ColumnInt32::create();
    auto offset_column = ColumnArray::ColumnOffsets::create();

    for (size_t i = 0; i < count; ++i) {
        // Keys cycle through `distinct_keys` names, so they repeat within a row.
        const auto value = static_cast<int32_t>(i % distinct_keys);
        const auto key = fmt::format("key_{}", value);
        key_column->insert_data(key.data(), key.size());
        // Pass the real byte width of the value instead of a literal 4.
        value_column->insert_data(reinterpret_cast<const char*>(&value), sizeof(value));
    }

    // Offsets are cumulative end positions: row i ends at (i + 1) * entries_per_row.
    size_t offset = 0;
    for (size_t i = 0; i < rows; ++i) {
        offset += entries_per_row;
        offset_column->insert_data(reinterpret_cast<const char*>(&offset), sizeof(offset));
    }

    auto column_map = ColumnMap::create(std::move(key_column), std::move(value_column),
                                        std::move(offset_column));
    block.insert({std::move(column_map), type_map, "map"});
    block.insert({nullptr, type_map, "result"});

    // Column 0 is the argument, column 1 receives the result.
    uint32_t result = 1;
    auto st = function->execute(nullptr, block, {0}, result, rows);
    ASSERT_TRUE(st.ok()) << "execute failed: " << st.to_string();

    auto result_column = block.get_by_position(result).column;
    auto& result_map_column = assert_cast<const ColumnMap&>(*result_column);
    const auto& result_offsets = result_map_column.get_offsets();

    // Guard the indexed reads below: the result must have one offset per row.
    ASSERT_EQ(result_offsets.size(), rows) << "unexpected number of result rows";

    uint64_t previous_end = 0;
    for (size_t i = 0; i < rows; ++i) {
        const uint64_t current_end = result_offsets[i];
        const uint64_t map_size = current_end - previous_end;
        ASSERT_EQ(map_size, distinct_keys) << "deduplicate map failed at row " << i;
        previous_end = current_end;
    }
}
} // namespace doris::vectorized