| // Licensed to the Apache Software Foundation (ASF) under one |
| // or more contributor license agreements. See the NOTICE file |
| // distributed with this work for additional information |
| // regarding copyright ownership. The ASF licenses this file |
| // to you under the Apache License, Version 2.0 (the |
| // "License"); you may not use this file except in compliance |
| // with the License. You may obtain a copy of the License at |
| // |
| // http://www.apache.org/licenses/LICENSE-2.0 |
| // |
| // Unless required by applicable law or agreed to in writing, |
| // software distributed under the License is distributed on an |
| // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| // KIND, either express or implied. See the License for the |
| // specific language governing permissions and limitations |
| // under the License. |
| |
| #pragma once |
| |
| #include <fmt/core.h> |
| #include <gen_cpp/Opcodes_types.h> |
| #include <glog/logging.h> |
| #include <math.h> |
| |
| #include "common/logging.h" |
| #include "olap/olap_tuple.h" |
| #include "runtime/primitive_type.h" |
| |
| namespace doris { |
| |
| using CompareLargeFunc = bool (*)(const void*, const void*); |
| |
| static const char* NEGATIVE_INFINITY = "-oo"; |
| static const char* POSITIVE_INFINITY = "+oo"; |
| |
| struct OlapScanRange { |
| public: |
| OlapScanRange() : begin_include(true), end_include(true) { |
| begin_scan_range.add_value(NEGATIVE_INFINITY); |
| end_scan_range.add_value(POSITIVE_INFINITY); |
| } |
| OlapScanRange(bool begin, bool end, std::vector<std::string>& begin_range, |
| std::vector<std::string>& end_range) |
| : begin_include(begin), |
| end_include(end), |
| begin_scan_range(begin_range), |
| end_scan_range(end_range) {} |
| |
| bool begin_include; |
| bool end_include; |
| OlapTuple begin_scan_range; |
| OlapTuple end_scan_range; |
| |
| std::string debug_string() const { |
| fmt::memory_buffer buf; |
| DCHECK_EQ(begin_scan_range.size(), end_scan_range.size()); |
| for (int i = 0; i < begin_scan_range.size(); i++) { |
| fmt::format_to(buf, "({}, {})\n", begin_scan_range[i], end_scan_range[i]); |
| } |
| return fmt::to_string(buf); |
| } |
| }; |
| |
| static char encoding_table[] = {'A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I', 'J', 'K', 'L', 'M', |
| 'N', 'O', 'P', 'Q', 'R', 'S', 'T', 'U', 'V', 'W', 'X', 'Y', 'Z', |
| 'a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i', 'j', 'k', 'l', 'm', |
| 'n', 'o', 'p', 'q', 'r', 's', 't', 'u', 'v', 'w', 'x', 'y', 'z', |
| '0', '1', '2', '3', '4', '5', '6', '7', '8', '9', '+', '/'}; |
| |
| static int mod_table[] = {0, 2, 1}; |
| static const char base64_pad = '='; |
| |
| inline size_t base64_encode(const char* data, size_t length, char* encoded_data) { |
| size_t output_length = (size_t)(4.0 * ceil((double)length / 3.0)); |
| |
| if (encoded_data == nullptr) { |
| return 0; |
| } |
| |
| for (uint32_t i = 0, j = 0; i < length;) { |
| uint32_t octet_a = i < length ? (unsigned char)data[i++] : 0; |
| uint32_t octet_b = i < length ? (unsigned char)data[i++] : 0; |
| uint32_t octet_c = i < length ? (unsigned char)data[i++] : 0; |
| |
| uint32_t triple = (octet_a << 0x10) + (octet_b << 0x08) + octet_c; |
| |
| encoded_data[j++] = encoding_table[(triple >> 3 * 6) & 0x3F]; |
| encoded_data[j++] = encoding_table[(triple >> 2 * 6) & 0x3F]; |
| encoded_data[j++] = encoding_table[(triple >> 1 * 6) & 0x3F]; |
| encoded_data[j++] = encoding_table[(triple >> 0 * 6) & 0x3F]; |
| } |
| |
| for (int i = 0; i < mod_table[length % 3]; i++) { |
| encoded_data[output_length - 1 - i] = base64_pad; |
| } |
| |
| return output_length; |
| } |
| |
| enum SQLFilterOp { |
| FILTER_LARGER = 0, |
| FILTER_LARGER_OR_EQUAL = 1, |
| FILTER_LESS = 2, |
| FILTER_LESS_OR_EQUAL = 3, |
| FILTER_IN = 4, |
| FILTER_NOT_IN = 5 |
| }; |
| |
| template <PrimitiveType> |
| constexpr bool always_false_v = false; |
| |
| inline SQLFilterOp to_olap_filter_type(TExprOpcode::type type, bool opposite) { |
| switch (type) { |
| case TExprOpcode::LT: |
| return opposite ? FILTER_LARGER : FILTER_LESS; |
| |
| case TExprOpcode::LE: |
| return opposite ? FILTER_LARGER_OR_EQUAL : FILTER_LESS_OR_EQUAL; |
| |
| case TExprOpcode::GT: |
| return opposite ? FILTER_LESS : FILTER_LARGER; |
| |
| case TExprOpcode::GE: |
| return opposite ? FILTER_LESS_OR_EQUAL : FILTER_LARGER_OR_EQUAL; |
| |
| case TExprOpcode::EQ: |
| return opposite ? FILTER_NOT_IN : FILTER_IN; |
| |
| case TExprOpcode::NE: |
| return opposite ? FILTER_IN : FILTER_NOT_IN; |
| |
| case TExprOpcode::EQ_FOR_NULL: |
| return FILTER_IN; |
| |
| default: |
| VLOG_CRITICAL << "TExprOpcode: " << type; |
| DCHECK(false); |
| } |
| |
| return FILTER_IN; |
| } |
| |
| inline SQLFilterOp to_olap_filter_type(const std::string& function_name, bool opposite) { |
| if (function_name == "lt") { |
| return opposite ? FILTER_LARGER : FILTER_LESS; |
| } else if (function_name == "gt") { |
| return opposite ? FILTER_LESS : FILTER_LARGER; |
| } else if (function_name == "le") { |
| return opposite ? FILTER_LARGER_OR_EQUAL : FILTER_LESS_OR_EQUAL; |
| } else if (function_name == "ge") { |
| return opposite ? FILTER_LESS_OR_EQUAL : FILTER_LARGER_OR_EQUAL; |
| } else if (function_name == "eq") { |
| return opposite ? FILTER_NOT_IN : FILTER_IN; |
| } else if (function_name == "ne") { |
| return opposite ? FILTER_IN : FILTER_NOT_IN; |
| } else { |
| DCHECK(false) << "Function Name: " << function_name; |
| return FILTER_IN; |
| } |
| } |
| |
| enum class MatchType { |
| UNKNOWN = -1, |
| MATCH_ANY = 0, |
| MATCH_ALL = 1, |
| MATCH_PHRASE = 2, |
| MATCH_ELEMENT_EQ = 3, |
| MATCH_ELEMENT_LT = 4, |
| MATCH_ELEMENT_GT = 5, |
| MATCH_ELEMENT_LE = 6, |
| MATCH_ELEMENT_GE = 7, |
| MATCH_PHRASE_PREFIX = 8, |
| MATCH_REGEXP = 9, |
| }; |
| |
| inline MatchType to_match_type(TExprOpcode::type type) { |
| switch (type) { |
| case TExprOpcode::type::MATCH_ANY: |
| return MatchType::MATCH_ANY; |
| break; |
| case TExprOpcode::type::MATCH_ALL: |
| return MatchType::MATCH_ALL; |
| break; |
| case TExprOpcode::type::MATCH_PHRASE: |
| return MatchType::MATCH_PHRASE; |
| break; |
| case TExprOpcode::type::MATCH_PHRASE_PREFIX: |
| return MatchType::MATCH_PHRASE_PREFIX; |
| break; |
| case TExprOpcode::type::MATCH_REGEXP: |
| return MatchType::MATCH_REGEXP; |
| break; |
| case TExprOpcode::type::MATCH_ELEMENT_EQ: |
| return MatchType::MATCH_ELEMENT_EQ; |
| break; |
| case TExprOpcode::type::MATCH_ELEMENT_LT: |
| return MatchType::MATCH_ELEMENT_LT; |
| break; |
| case TExprOpcode::type::MATCH_ELEMENT_GT: |
| return MatchType::MATCH_ELEMENT_GT; |
| break; |
| case TExprOpcode::type::MATCH_ELEMENT_LE: |
| return MatchType::MATCH_ELEMENT_LE; |
| break; |
| case TExprOpcode::type::MATCH_ELEMENT_GE: |
| return MatchType::MATCH_ELEMENT_GE; |
| break; |
| default: |
| VLOG_CRITICAL << "TExprOpcode: " << type; |
| DCHECK(false); |
| } |
| return MatchType::MATCH_ANY; |
| } |
| |
| inline MatchType to_match_type(const std::string& condition_op) { |
| if (condition_op.compare("match_any") == 0) { |
| return MatchType::MATCH_ANY; |
| } else if (condition_op.compare("match_all") == 0) { |
| return MatchType::MATCH_ALL; |
| } else if (condition_op.compare("match_phrase") == 0) { |
| return MatchType::MATCH_PHRASE; |
| } else if (condition_op.compare("match_phrase_prefix") == 0) { |
| return MatchType::MATCH_PHRASE_PREFIX; |
| } else if (condition_op.compare("match_regexp") == 0) { |
| return MatchType::MATCH_REGEXP; |
| } else if (condition_op.compare("match_element_eq") == 0) { |
| return MatchType::MATCH_ELEMENT_EQ; |
| } else if (condition_op.compare("match_element_lt") == 0) { |
| return MatchType::MATCH_ELEMENT_LT; |
| } else if (condition_op.compare("match_element_gt") == 0) { |
| return MatchType::MATCH_ELEMENT_GT; |
| } else if (condition_op.compare("match_element_le") == 0) { |
| return MatchType::MATCH_ELEMENT_LE; |
| } else if (condition_op.compare("match_element_ge") == 0) { |
| return MatchType::MATCH_ELEMENT_GE; |
| } |
| return MatchType::UNKNOWN; |
| } |
| |
| inline bool is_match_condition(const std::string& op) { |
| if (0 == strcasecmp(op.c_str(), "match_any") || 0 == strcasecmp(op.c_str(), "match_all") || |
| 0 == strcasecmp(op.c_str(), "match_phrase") || |
| 0 == strcasecmp(op.c_str(), "match_phrase_prefix") || |
| 0 == strcasecmp(op.c_str(), "match_regexp") || |
| 0 == strcasecmp(op.c_str(), "match_element_eq") || |
| 0 == strcasecmp(op.c_str(), "match_element_lt") || |
| 0 == strcasecmp(op.c_str(), "match_element_gt") || |
| 0 == strcasecmp(op.c_str(), "match_element_le") || |
| 0 == strcasecmp(op.c_str(), "match_element_ge")) { |
| return true; |
| } |
| return false; |
| } |
| |
| inline bool is_match_operator(const TExprOpcode::type& op_type) { |
| return TExprOpcode::MATCH_ANY == op_type || TExprOpcode::MATCH_ALL == op_type || |
| TExprOpcode::MATCH_PHRASE == op_type || TExprOpcode::MATCH_PHRASE_PREFIX == op_type || |
| TExprOpcode::MATCH_REGEXP == op_type || TExprOpcode::MATCH_ELEMENT_EQ == op_type || |
| TExprOpcode::MATCH_ELEMENT_LT == op_type || TExprOpcode::MATCH_ELEMENT_GT == op_type || |
| TExprOpcode::MATCH_ELEMENT_LE == op_type || TExprOpcode::MATCH_ELEMENT_GE == op_type; |
| } |
| |
| } // namespace doris |