blob: f21a7b5d94e0c3d9d99f0b2a2373ba8370d81a0e [file] [log] [blame]
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
// This file is copied from
// https://github.com/ClickHouse/ClickHouse/blob/master/src/Functions/array/arrayZip.cpp
// and modified by Doris
#include <fmt/format.h>
#include <glog/logging.h>
#include <stddef.h>
#include <algorithm>
#include <memory>
#include <ostream>
#include <string>
#include <utility>
#include "common/status.h"
#include "vec/aggregate_functions/aggregate_function.h"
#include "vec/columns/column.h"
#include "vec/columns/column_array.h"
#include "vec/columns/column_nullable.h"
#include "vec/columns/column_struct.h"
#include "vec/columns/column_vector.h"
#include "vec/core/block.h"
#include "vec/core/column_numbers.h"
#include "vec/core/column_with_type_and_name.h"
#include "vec/core/types.h"
#include "vec/data_types/data_type.h"
#include "vec/data_types/data_type_array.h"
#include "vec/data_types/data_type_nullable.h"
#include "vec/data_types/data_type_struct.h"
#include "vec/functions/function.h"
#include "vec/functions/function_helpers.h"
#include "vec/functions/simple_function_factory.h"
// Forward declaration only: within this file FunctionContext appears solely as a
// pointer parameter type, so its full definition is not required here.
namespace doris {
class FunctionContext;
} // namespace doris
namespace doris::vectorized {
/// Combines multiple arrays into a single array of structs (tuples).
///
/// Example:
///   array_zip(['d', 'o', 'r', 'i', 's'], [1, 2, 3, 4, 5])
///       -> [('d', 1), ('o', 2), ('r', 3), ('i', 4), ('s', 5)]
///
/// The function is variadic. Every argument must be an array, and every argument
/// must have the same offsets as the first one (checked via has_equal_offsets).
/// The result type is Array(Nullable(Struct(Nullable(T1), ..., Nullable(Tn)))),
/// where Ti is the (non-nullable) nested type of the i-th argument.
class FunctionArrayZip : public IFunction {
public:
    static constexpr auto name = "array_zip";

    static FunctionPtr create() { return std::make_shared<FunctionArrayZip>(); }

    /// Get function name.
    String get_name() const override { return name; }

    /// Accepts any number of arguments, so the fixed argument count is reported as 0.
    bool is_variadic() const override { return true; }

    size_t get_number_of_arguments() const override { return 0; }

    /// Builds the result type from the argument types.
    ///
    /// @param arguments argument types; each is expected to be an array type
    ///                  (only enforced by DCHECK, i.e. in debug builds).
    /// @return Array(Nullable(Struct(...))) whose i-th field is the nested type of
    ///         the i-th argument, wrapped as nullable.
    DataTypePtr get_return_type_impl(const DataTypes& arguments) const override {
        DCHECK(arguments.size() > 0)
                << "function: " << get_name() << ", arguments should not be empty";

        const size_t num_elements = arguments.size();
        DataTypes res_data_types;
        res_data_types.reserve(num_elements);
        for (size_t i = 0; i < num_elements; ++i) {
            DCHECK(arguments[i]->get_primitive_type() == TYPE_ARRAY)
                    << i << "-th element is not array type";
            const auto* array_type = check_and_get_data_type<DataTypeArray>(arguments[i].get());
            DCHECK(array_type) << "function: " << get_name() << " " << i + 1
                               << "-th argument is not array";
            // Normalize each field to exactly one level of nullability.
            res_data_types.emplace_back(
                    make_nullable(remove_nullable((array_type->get_nested_type()))));
        }

        return std::make_shared<DataTypeArray>(
                make_nullable(std::make_shared<DataTypeStruct>(res_data_types)));
    }

    /// Zips the argument array columns into one array-of-struct column.
    ///
    /// @param context          unused by this function.
    /// @param block            block holding the argument columns and the result slot.
    /// @param arguments        positions of the argument columns inside @p block.
    /// @param result           position in @p block that receives the result column.
    /// @param input_rows_count unused by this function.
    /// @return Status::OK() on success; Status::RuntimeError if there are no
    ///         arguments, if an argument is not an array column, or if an argument's
    ///         offsets differ from those of the first argument.
    Status execute_impl(FunctionContext* context, Block& block, const ColumnNumbers& arguments,
                        uint32_t result, size_t input_rows_count) const override {
        const size_t num_element = arguments.size();
        // The DCHECK in get_return_type_impl vanishes in release builds; without this
        // guard an empty argument list would dereference a null first column below.
        if (num_element == 0) {
            return Status::RuntimeError(fmt::format(
                    "execute failed, function {} requires at least one argument", get_name()));
        }

        // all the columns must have the same size as the first column
        // `first_array_column` owns the materialized first argument so that
        // `first_array` (a typed view of it) stays valid until the result is built.
        ColumnPtr first_array_column;
        const ColumnArray* first_array = nullptr;
        Columns tuple_columns(num_element);
        for (size_t i = 0; i < num_element; ++i) {
            ColumnPtr col = block.get_by_position(arguments[i])
                                    .column->convert_to_full_column_if_const();
            const auto* column_array = check_and_get_column<ColumnArray>(col.get());
            if (!column_array) {
                return Status::RuntimeError(fmt::format(
                        "execute failed, function {}'s {}-th argument should be array but got {}",
                        get_name(), i + 1, block.get_by_position(arguments[i]).type->get_name()));
            }

            if (i == 0) {
                first_array_column = col;
                first_array = column_array;
            } else if (!column_array->has_equal_offsets(*first_array)) {
                return Status::RuntimeError(
                        fmt::format("execute failed, function {}'s {}-th argument should have same "
                                    "offsets with first argument",
                                    get_name(), i + 1));
            }

            tuple_columns[i] = column_array->get_data_ptr();
        }

        auto tuples = ColumnStruct::create(tuple_columns);
        // Read the size and build the null map BEFORE moving `tuples`, so the code
        // never touches a moved-from pointer regardless of argument evaluation order.
        const size_t tuple_count = tuples->size();
        // All-zero null map: every produced struct entry is marked as non-null.
        auto tuple_null_map = ColumnUInt8::create(tuple_count, 0);
        auto nullable_tuples =
                ColumnNullable::create(std::move(tuples), std::move(tuple_null_map));

        // The result reuses the first argument's offsets.
        auto res_column =
                ColumnArray::create(std::move(nullable_tuples), first_array->get_offsets_ptr());
        block.replace_by_position(result, std::move(res_column));
        return Status::OK();
    }
};
// Adds FunctionArrayZip to the given function factory.
// NOTE(review): presumably the factory keys the function by FunctionArrayZip::name
// ("array_zip") — confirm against SimpleFunctionFactory::register_function.
void register_function_array_zip(SimpleFunctionFactory& factory) {
factory.register_function<FunctionArrayZip>();
}
} // namespace doris::vectorized