blob: c6a20cd43a32cab3b64c6d33597e757092cc617a [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include <Core/Field.h>
#include <DataTypes/IDataType.h>
#include <Parser/FunctionParser.h>
#include <Common/BlockTypeUtils.h>
#include <Common/CHUtil.h>
namespace DB
{
namespace ErrorCodes
{
extern const int BAD_ARGUMENTS;
}
}
namespace local_engine
{
class FunctionParserArraySlice : public FunctionParser
{
public:
explicit FunctionParserArraySlice(ParserContextPtr parser_context_) : FunctionParser(parser_context_) { }
static constexpr auto name = "slice";
String getName() const override { return name; }
const DB::ActionsDAG::Node * parse(
const substrait::Expression_ScalarFunction & substrait_func,
DB::ActionsDAG & actions_dag) const override
{
/**
parse slice(arr, start, length) as
if (isNull(arr))
null
elif (isNull(start))
null
elif (if(isNull(length)))
null
else
slice(assumeNotNull(arr), if(isNotNull(arr) and start=0) then throwIf(isNotNull(arr) and start=0) else start, if (isNotNull(arr) and length<0) then throwIf(length<0) else length)
Main differences between CH arraySlice and Spark slice
1. Spark slice throws exception if start = 0 or length < 0
2. Spark slice returns null if any of the argument is null
*/
auto parsed_args = parseFunctionArguments(substrait_func, actions_dag);
if (parsed_args.size() != 3)
throw DB::Exception(DB::ErrorCodes::BAD_ARGUMENTS, "Function {} requires exactly three arguments", getName());
const auto * arr_arg = parsed_args[0];
const auto * start_arg = parsed_args[1];
const auto * length_arg = parsed_args[2];
auto is_arr_nullable = arr_arg->result_type->isNullable();
auto is_start_nullable = start_arg->result_type->isNullable();
auto is_length_nullable = length_arg->result_type->isNullable();
const auto * arr_not_null_node = toFunctionNode(actions_dag, "isNotNull", {arr_arg});
const auto * zero_const_node = addColumnToActionsDAG(actions_dag, std::make_shared<DB::DataTypeInt32>(), 0);
const auto * start_if_node = makeStartIfNode(actions_dag, start_arg, zero_const_node, arr_not_null_node);
const auto * length_if_node = makeLengthIfNode(actions_dag, length_arg, zero_const_node, arr_not_null_node);
if (!is_arr_nullable && !is_start_nullable && !is_length_nullable)
{
// slice(arr, if (start=0) then throwIf(start=0) else start, if (length<0) then throwIf(length<0) else length)
return toFunctionNode(actions_dag, "arraySlice", {arr_arg, start_if_node, length_if_node});
}
// There is at least one nullable argument, should return nullable result
const auto * arr_denull_node = is_arr_nullable ? toFunctionNode(actions_dag, "assumeNotNull", {arr_arg}) : arr_arg;
const auto * slice_node = toFunctionNode(actions_dag, "arraySlice", {arr_denull_node, start_if_node, length_if_node});
DB::DataTypePtr wrap_arr_nullable_type = wrapNullableType(true, slice_node->result_type);
const auto * wrap_slice_node = ActionsDAGUtil::convertNodeType(
actions_dag, slice_node, wrap_arr_nullable_type, slice_node->result_name);
const auto * null_const_node = addColumnToActionsDAG(actions_dag, wrap_arr_nullable_type, DB::Field{});
const auto * arr_is_null_node = toFunctionNode(actions_dag, "isNull", {arr_arg});
const auto * start_is_null_node = toFunctionNode(actions_dag, "isNull", {start_arg});
const auto * length_is_null_node = toFunctionNode(actions_dag, "isNull", {length_arg});
const auto * or_condition_node = toFunctionNode(actions_dag, "or", {arr_is_null_node, start_is_null_node, length_is_null_node});
const auto * if_node = toFunctionNode(actions_dag, "if", {or_condition_node, null_const_node, wrap_slice_node });
return convertNodeTypeIfNeeded(substrait_func, if_node, actions_dag);
}
private:
// if(isNotNull(arr) and start=0) then throwIf(isNotNull(arr) and start=0) else start
const DB::ActionsDAG::Node * makeStartIfNode(
DB::ActionsDAG & actions_dag,
const DB::ActionsDAG::Node * start_arg,
const DB::ActionsDAG::Node * zero_const_node,
const DB::ActionsDAG::Node * arr_not_null_node) const
{
const auto * start_equal_zero_node = toFunctionNode(actions_dag, "equals", {start_arg, zero_const_node});
const auto * condition_node = toFunctionNode(actions_dag, "and", {arr_not_null_node, start_equal_zero_node});
const auto * msg_node = addColumnToActionsDAG(actions_dag, std::make_shared<DB::DataTypeString>(), "Unexpected value for start");
const auto * throw_if_node = toFunctionNode(actions_dag, "throwIf", {condition_node, msg_node});
return toFunctionNode(actions_dag, "if", {condition_node, throw_if_node, start_arg});
}
// if (isNotNull(arr) and length<0) then throwIf(length<0) else length)
const DB::ActionsDAG::Node * makeLengthIfNode(
DB::ActionsDAG & actions_dag,
const DB::ActionsDAG::Node * length_arg,
const DB::ActionsDAG::Node * zero_const_node,
const DB::ActionsDAG::Node * arr_not_null_node) const
{
const auto * length_less_zero_node = toFunctionNode(actions_dag, "less", {length_arg, zero_const_node});
const auto * condition_node = toFunctionNode(actions_dag, "and", {arr_not_null_node, length_less_zero_node});
const auto * msg_node = addColumnToActionsDAG(actions_dag, std::make_shared<DB::DataTypeString>(), "Unexpected value for length");
const auto * throw_if_node = toFunctionNode(actions_dag, "throwIf", {condition_node, msg_node});
return toFunctionNode(actions_dag, "if", {condition_node, throw_if_node, length_arg});
}
};
static FunctionParserRegister<FunctionParserArraySlice> register_array_slice;
}