| /* |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, |
| * software distributed under the License is distributed on an |
| * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| * KIND, either express or implied. See the License for the |
| * specific language governing permissions and limitations |
| * under the License. |
| */ |
| |
| #pragma once |
| |
| #include <cassert> |
| #include <cstdint> |
| #include <memory> |
| #include <string> |
| #include <string_view> |
| #include <type_traits> |
| #include <utility> |
| #include <variant> |
| |
| #include "arrow/api.h" |
| #include "fmt/format.h" |
| #include "paimon/common/data/binary_string.h" |
| #include "paimon/data/decimal.h" |
| #include "paimon/data/timestamp.h" |
| #include "paimon/defs.h" |
| #include "paimon/memory/bytes.h" |
| #include "paimon/predicate/literal.h" |
| #include "paimon/result.h" |
| #include "paimon/status.h" |
| |
| namespace paimon { |
| class InternalArray; |
| class InternalRow; |
| class InternalMap; |
| |
| /// std::monostate indicates null |
| using NullType = std::monostate; |
| using VariantType = |
| std::variant<NullType, bool, char, int16_t, int32_t, int64_t, float, double, BinaryString, |
| std::shared_ptr<Bytes>, Timestamp, Decimal, std::shared_ptr<InternalRow>, |
| std::shared_ptr<InternalArray>, std::shared_ptr<InternalMap>, std::string_view>; |
| class DataDefine { |
| public: |
| DataDefine() = delete; |
| ~DataDefine() = delete; |
| inline static bool IsVariantNull(const VariantType& value) { |
| return std::holds_alternative<NullType>(value); |
| } |
| |
| // @warning Always make sure value is T type |
| template <typename T> |
| inline static T GetVariantValue(const VariantType& value) { |
| const T* ptr = std::get_if<T>(&value); |
| assert(ptr); |
| return *ptr; |
| } |
| |
| /// if value type mismatch T, return nullptr |
| template <typename T> |
| inline static const T* GetVariantPtr(const VariantType& value) { |
| return std::get_if<T>(&value); |
| } |
| |
| // @warning Always make sure value is string_view or std::shared_ptr<Bytes> or BinaryString |
| inline static std::string_view GetStringView(const VariantType& value) { |
| if (auto* view_ptr = GetVariantPtr<std::string_view>(value)) { |
| return *view_ptr; |
| } else if (auto* bytes_ptr = GetVariantPtr<std::shared_ptr<Bytes>>(value)) { |
| const auto& bytes = *bytes_ptr; |
| return std::string_view(bytes->data(), bytes->size()); |
| } else if (auto* binary_string_ptr = GetVariantPtr<BinaryString>(value)) { |
| return binary_string_ptr->GetStringView(); |
| } |
| assert(false); |
| return {}; |
| } |
| |
| static std::string VariantValueToString(const VariantType& value) { |
| return std::visit( |
| [](const auto& arg) -> std::string { |
| using T = std::decay_t<decltype(arg)>; |
| if constexpr (std::is_same_v<T, NullType>) { |
| return "null"; |
| } else if constexpr (std::is_same_v<T, bool>) { |
| return arg ? "true" : "false"; |
| } else if constexpr (std::is_same_v<T, std::shared_ptr<Bytes>>) { |
| return std::string(arg->data(), arg->size()); |
| } else if constexpr (std::is_same_v<T, // NOLINT(readability/braces) |
| BinaryString> || |
| std::is_same_v<T, Timestamp> || std::is_same_v<T, Decimal>) { |
| return arg.ToString(); |
| } else if constexpr (std::is_same_v<T, std::shared_ptr<InternalRow>>) { |
| return "row"; |
| } else if constexpr (std::is_same_v<T, std::shared_ptr<InternalArray>>) { |
| return "array"; |
| } else if constexpr (std::is_same_v<T, std::shared_ptr<InternalMap>>) { |
| return "map"; |
| } else if constexpr (std::is_same_v<T, std::string_view>) { |
| return std::string(arg); |
| } else { |
| return std::to_string(arg); |
| } |
| }, |
| value); |
| } |
| |
| static Result<Literal> VariantValueToLiteral(const VariantType& value, |
| const arrow::Type::type& arrow_type) { |
| switch (arrow_type) { |
| case arrow::Type::type::BOOL: |
| return Literal(GetVariantValue<bool>(value)); |
| case arrow::Type::type::INT8: |
| return Literal(static_cast<int8_t>(GetVariantValue<char>(value))); |
| case arrow::Type::type::INT16: |
| return Literal(GetVariantValue<int16_t>(value)); |
| case arrow::Type::type::INT32: |
| return Literal(GetVariantValue<int32_t>(value)); |
| case arrow::Type::type::INT64: |
| return Literal(GetVariantValue<int64_t>(value)); |
| case arrow::Type::type::FLOAT: |
| return Literal(GetVariantValue<float>(value)); |
| case arrow::Type::type::DOUBLE: |
| return Literal(GetVariantValue<double>(value)); |
| case arrow::Type::type::STRING: { |
| auto view = GetStringView(value); |
| return Literal(FieldType::STRING, view.data(), view.size()); |
| } |
| case arrow::Type::type::BINARY: { |
| auto view = GetStringView(value); |
| return Literal(FieldType::BINARY, view.data(), view.size()); |
| } |
| case arrow::Type::type::TIMESTAMP: |
| return Literal(GetVariantValue<Timestamp>(value)); |
| case arrow::Type::type::DECIMAL128: |
| return Literal(GetVariantValue<Decimal>(value)); |
| case arrow::Type::type::DATE32: |
| return Literal(FieldType::DATE, GetVariantValue<int32_t>(value)); |
| default: |
| return Status::Invalid( |
| fmt::format("Not support arrow type {} in VariantValueToLiteral", |
| static_cast<int32_t>(arrow_type))); |
| } |
| } |
| }; |
| } // namespace paimon |