| // Licensed to the Apache Software Foundation (ASF) under one |
| // or more contributor license agreements. See the NOTICE file |
| // distributed with this work for additional information |
| // regarding copyright ownership. The ASF licenses this file |
| // to you under the Apache License, Version 2.0 (the |
| // "License"); you may not use this file except in compliance |
| // with the License. You may obtain a copy of the License at |
| // |
| // http://www.apache.org/licenses/LICENSE-2.0 |
| // |
| // Unless required by applicable law or agreed to in writing, |
| // software distributed under the License is distributed on an |
| // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| // KIND, either express or implied. See the License for the |
| // specific language governing permissions and limitations |
| // under the License. |
| |
| #pragma once |
| |
| #include "core/data_type_serde/data_type_serde.h" |
| #include "core/types.h" |
| #include "core/value/time_value.h" |
| #include "exprs/function/cast/cast_base.h" |
| #include "util/mysql_global.h" |
| #include "util/to_string.h" |
| namespace doris { |
| #include "common/compile_check_begin.h" |
| struct CastToString { |
| template <class SRC> |
| static inline std::string from_number(const SRC& from); |
| |
| // Caller is responsible for ensuring that `buffer` has enough space. |
| template <class SRC> |
| static inline int from_number(const SRC& from, char* buffer); |
| |
| template <typename T> |
| requires(std::is_same_v<T, Float32> || std::is_same_v<T, Float64>) |
| static inline int from_number(const T& from, char* buffer); |
| |
| template <class SRC> |
| static inline void push_number(const SRC& from, ColumnString::Chars& chars); |
| |
| template <class SRC> |
| static inline void push_number(const SRC& from, BufferWritable& bw); |
| |
| template <class SRC> |
| static inline std::string from_decimal(const SRC& from, UInt32 scale); |
| |
| template <class SRC> |
| static inline void push_decimal(const SRC& from, UInt32 scale, BufferWritable& bw); |
| |
| static inline std::string from_date_or_datetime(const VecDateTimeValue& from); |
| |
| static inline void push_date_or_datetime(const VecDateTimeValue& from, |
| ColumnString::Chars& chars); |
| static inline void push_date_or_datetime(const VecDateTimeValue& from, BufferWritable& bw); |
| |
| static inline std::string from_datev2(const DateV2Value<DateV2ValueType>& from); |
| static inline void push_datev2(const DateV2Value<DateV2ValueType>& from, |
| ColumnString::Chars& chars); |
| static inline void push_datev2(const DateV2Value<DateV2ValueType>& from, BufferWritable& bw); |
| |
| static inline std::string from_datetimev2(const DateV2Value<DateTimeV2ValueType>& from, |
| UInt32 scale); |
| static inline std::string from_timestamptz(const TimestampTzValue& from, UInt32 scale, |
| const cctz::time_zone* timezone = nullptr); |
| static inline void push_datetimev2(const DateV2Value<DateTimeV2ValueType>& from, UInt32 scale, |
| ColumnString::Chars& chars); |
| |
| static inline void push_datetimev2(const DateV2Value<DateTimeV2ValueType>& from, UInt32 scale, |
| BufferWritable& bw); |
| static inline void push_timestamptz(const TimestampTzValue& from, UInt32 scale, |
| BufferWritable& bw, |
| const DataTypeSerDe::FormatOptions& options); |
| |
| template <class SRC> |
| static inline std::string from_ip(const SRC& from); |
| |
| template <class SRC> |
| static inline void push_ip(const SRC& from, BufferWritable& bw); |
| |
| static inline std::string from_time(const TimeValue::TimeType& from, UInt32 scale); |
| |
| static inline void push_time(const TimeValue::TimeType& from, UInt32 scale, BufferWritable& bw); |
| |
| template <PrimitiveType T> |
| static constexpr size_t string_length = 1; |
| |
| private: |
| // refer to: https://en.cppreference.com/w/cpp/types/numeric_limits/max_digits10.html |
| template <typename T> |
| requires(std::is_same_v<T, float> || std::is_same_v<T, double>) |
| static inline int _fast_to_buffer(T value, char* buffer) { |
| char* end = nullptr; |
| // output NaN and Infinity to be compatible with most of the implementations |
| if (std::isnan(value)) { |
| static constexpr char nan_str[] = "NaN"; |
| static constexpr int nan_str_len = sizeof(nan_str) - 1; |
| memcpy(buffer, nan_str, nan_str_len); |
| end = buffer + nan_str_len; |
| } else if (std::isinf(value)) { |
| static constexpr char inf_str[] = "Infinity"; |
| static constexpr int inf_str_len = sizeof(inf_str) - 1; |
| static constexpr char neg_inf_str[] = "-Infinity"; |
| static constexpr int neg_inf_str_len = sizeof(neg_inf_str) - 1; |
| if (value > 0) { |
| memcpy(buffer, inf_str, inf_str_len); |
| end = buffer + inf_str_len; |
| } else { |
| memcpy(buffer, neg_inf_str, neg_inf_str_len); |
| end = buffer + neg_inf_str_len; |
| } |
| } else { |
| if constexpr (std::is_same_v<T, float>) { |
| end = fmt::format_to(buffer, FMT_COMPILE("{:.{}g}"), value, |
| std::numeric_limits<float>::digits10 + 1); |
| } else { |
| end = fmt::format_to(buffer, FMT_COMPILE("{:.{}g}"), value, |
| std::numeric_limits<double>::digits10 + 1); |
| } |
| } |
| *end = '\0'; |
| return int(end - buffer); |
| } |
| }; |
| |
| template <> |
| constexpr size_t CastToString::string_length<TYPE_BOOLEAN> = 1; |
| template <> |
| constexpr size_t CastToString::string_length<TYPE_TINYINT> = 4; |
| template <> |
| constexpr size_t CastToString::string_length<TYPE_SMALLINT> = 6; |
| template <> |
| constexpr size_t CastToString::string_length<TYPE_INT> = 11; |
| template <> |
| constexpr size_t CastToString::string_length<TYPE_BIGINT> = 20; |
| template <> |
| constexpr size_t CastToString::string_length<TYPE_LARGEINT> = 40; |
| template <> |
| constexpr size_t CastToString::string_length<TYPE_FLOAT> = MAX_FLOAT_STR_LENGTH; |
| template <> |
| constexpr size_t CastToString::string_length<TYPE_DOUBLE> = MAX_DOUBLE_STR_LENGTH; |
| template <> |
| constexpr size_t CastToString::string_length<TYPE_DECIMAL32> = 14; |
| template <> |
| constexpr size_t CastToString::string_length<TYPE_DECIMAL64> = 24; |
| template <> |
| constexpr size_t CastToString::string_length<TYPE_DECIMALV2> = 24; |
| template <> |
| constexpr size_t CastToString::string_length<TYPE_DECIMAL128I> = 39; |
| template <> |
| constexpr size_t CastToString::string_length<TYPE_DECIMAL256> = 78; |
| template <> |
| constexpr size_t CastToString::string_length<TYPE_DATE> = sizeof("YYYY-MM-DD") - 1; |
| template <> |
| constexpr size_t CastToString::string_length<TYPE_DATETIME> = sizeof("YYYY-MM-DD HH:MM:SS") - 1; |
| template <> |
| constexpr size_t CastToString::string_length<TYPE_DATEV2> = sizeof("YYYY-MM-DD") - 1; |
| template <> |
| constexpr size_t CastToString::string_length<TYPE_DATETIMEV2> = |
| sizeof("YYYY-MM-DD HH:MM:SS.ssssss") - 1; |
| template <> |
| constexpr size_t CastToString::string_length<TYPE_TIMEV2> = sizeof("-838:59:59.999999") - 1; |
| template <> |
| constexpr size_t CastToString::string_length<TYPE_IPV4> = sizeof("255.255 .255.255") - 1; |
| template <> |
| constexpr size_t CastToString::string_length<TYPE_IPV6> = |
| sizeof("ffff:ffff:ffff:ffff:ffff:ffff:ffff:ffff") - 1; |
| |
| // BOOLEAN |
| template <> |
| inline std::string CastToString::from_number(const UInt8& num) { |
| auto f = fmt::format_int(num); |
| return std::string(f.data(), f.data() + f.size()); |
| } |
| |
| template <> |
| inline void CastToString::push_number(const UInt8& num, ColumnString::Chars& chars) { |
| auto f = fmt::format_int(num); |
| chars.insert(f.data(), f.data() + f.size()); |
| } |
| |
| template <> |
| inline void CastToString::push_number(const UInt8& num, BufferWritable& bw) { |
| auto f = fmt::format_int(num); |
| bw.write(f.data(), f.size()); |
| } |
| |
| // TINYINT |
| template <> |
| inline std::string CastToString::from_number(const Int8& num) { |
| auto f = fmt::format_int(num); |
| return std::string(f.data(), f.data() + f.size()); |
| } |
| |
| template <> |
| inline void CastToString::push_number(const Int8& num, ColumnString::Chars& chars) { |
| auto f = fmt::format_int(num); |
| chars.insert(f.data(), f.data() + f.size()); |
| } |
| |
| template <> |
| inline void CastToString::push_number(const Int8& num, BufferWritable& bw) { |
| auto f = fmt::format_int(num); |
| bw.write(f.data(), f.size()); |
| } |
| |
| // SMALLINT |
| template <> |
| inline std::string CastToString::from_number(const Int16& num) { |
| auto f = fmt::format_int(num); |
| return std::string(f.data(), f.data() + f.size()); |
| } |
| |
| template <> |
| inline void CastToString::push_number(const Int16& num, ColumnString::Chars& chars) { |
| auto f = fmt::format_int(num); |
| chars.insert(f.data(), f.data() + f.size()); |
| } |
| |
| template <> |
| inline void CastToString::push_number(const Int16& num, BufferWritable& bw) { |
| auto f = fmt::format_int(num); |
| bw.write(f.data(), f.size()); |
| } |
| |
| // INT |
| template <> |
| inline std::string CastToString::from_number(const Int32& num) { |
| auto f = fmt::format_int(num); |
| return std::string(f.data(), f.data() + f.size()); |
| } |
| |
| template <> |
| inline void CastToString::push_number(const Int32& num, ColumnString::Chars& chars) { |
| auto f = fmt::format_int(num); |
| chars.insert(f.data(), f.data() + f.size()); |
| } |
| |
| template <> |
| inline void CastToString::push_number(const Int32& num, BufferWritable& bw) { |
| auto f = fmt::format_int(num); |
| bw.write(f.data(), f.size()); |
| } |
| |
| // BIGINT |
| template <> |
| inline std::string CastToString::from_number(const Int64& num) { |
| auto f = fmt::format_int(num); |
| return std::string(f.data(), f.data() + f.size()); |
| } |
| |
| template <> |
| inline void CastToString::push_number(const Int64& num, ColumnString::Chars& chars) { |
| auto f = fmt::format_int(num); |
| chars.insert(f.data(), f.data() + f.size()); |
| } |
| |
| template <> |
| inline void CastToString::push_number(const Int64& num, BufferWritable& bw) { |
| auto f = fmt::format_int(num); |
| bw.write(f.data(), f.size()); |
| } |
| |
| // LARGEINT |
| template <> |
| inline std::string CastToString::from_number(const Int128& num) { |
| fmt::memory_buffer buffer; |
| fmt::format_to(buffer, "{}", num); |
| return std::string(buffer.data(), buffer.size()); |
| } |
| |
| template <> |
| inline void CastToString::push_number(const Int128& num, ColumnString::Chars& chars) { |
| fmt::memory_buffer buffer; |
| fmt::format_to(buffer, "{}", num); |
| chars.insert(buffer.data(), buffer.data() + buffer.size()); |
| } |
| |
| template <> |
| inline void CastToString::push_number(const Int128& num, BufferWritable& bw) { |
| fmt::memory_buffer buffer; |
| fmt::format_to(buffer, "{}", num); |
| bw.write(buffer.data(), buffer.size()); |
| } |
| |
| // FLOAT |
| |
| template <> |
| inline std::string CastToString::from_number(const Float32& num) { |
| char buf[MAX_FLOAT_STR_LENGTH + 2]; |
| int len = _fast_to_buffer(num, buf); |
| return std::string(buf, buf + len); |
| } |
| |
| template <typename T> |
| requires(std::is_same_v<T, Float32> || std::is_same_v<T, Float64>) |
| inline int CastToString::from_number(const T& from, char* buffer) { |
| return _fast_to_buffer(from, buffer); |
| } |
| |
| template <> |
| inline void CastToString::push_number(const Float32& num, ColumnString::Chars& chars) { |
| char buf[MAX_FLOAT_STR_LENGTH + 2]; |
| int len = _fast_to_buffer(num, buf); |
| chars.insert(buf, buf + len); |
| } |
| |
| template <> |
| inline void CastToString::push_number(const Float32& num, BufferWritable& bw) { |
| char buf[MAX_FLOAT_STR_LENGTH + 2]; |
| int len = _fast_to_buffer(num, buf); |
| bw.write(buf, len); |
| } |
| |
| // DOUBLE |
| template <> |
| inline std::string CastToString::from_number(const Float64& num) { |
| char buf[MAX_DOUBLE_STR_LENGTH + 2]; |
| int len = _fast_to_buffer(num, buf); |
| return std::string(buf, len); |
| } |
| |
| template <> |
| inline void CastToString::push_number(const Float64& num, ColumnString::Chars& chars) { |
| char buf[MAX_DOUBLE_STR_LENGTH + 2]; |
| int len = _fast_to_buffer(num, buf); |
| chars.insert(buf, buf + len); |
| } |
| |
| template <> |
| inline void CastToString::push_number(const Float64& num, BufferWritable& bw) { |
| char buf[MAX_DOUBLE_STR_LENGTH + 2]; |
| int len = _fast_to_buffer(num, buf); |
| bw.write(buf, len); |
| } |
| |
| // DECIMAL32 |
| template <> |
| inline std::string CastToString::from_decimal(const Decimal32& from, UInt32 scale) { |
| return from.to_string(scale); |
| } |
| |
| template <> |
| inline void CastToString::push_decimal(const Decimal32& from, UInt32 scale, BufferWritable& bw) { |
| std::string str = from.to_string(scale); |
| bw.write(str.data(), str.size()); |
| } |
| |
| // DECIMAL64 |
| template <> |
| inline std::string CastToString::from_decimal(const Decimal64& from, UInt32 scale) { |
| return from.to_string(scale); |
| } |
| |
| template <> |
| inline void CastToString::push_decimal(const Decimal64& from, UInt32 scale, BufferWritable& bw) { |
| std::string str = from.to_string(scale); |
| bw.write(str.data(), str.size()); |
| } |
| |
| // DECIMAL128 |
| template <> |
| inline std::string CastToString::from_decimal(const Decimal128V3& from, UInt32 scale) { |
| return from.to_string(scale); |
| } |
| |
| template <> |
| inline void CastToString::push_decimal(const Decimal128V3& from, UInt32 scale, BufferWritable& bw) { |
| std::string str = from.to_string(scale); |
| bw.write(str.data(), str.size()); |
| } |
| |
| // DECIMAL256 |
| template <> |
| inline std::string CastToString::from_decimal(const Decimal256& from, UInt32 scale) { |
| return from.to_string(scale); |
| } |
| |
| template <> |
| inline void CastToString::push_decimal(const Decimal256& from, UInt32 scale, BufferWritable& bw) { |
| std::string str = from.to_string(scale); |
| bw.write(str.data(), str.size()); |
| } |
| |
| // DECIMALV2 |
| template <> |
| inline std::string CastToString::from_decimal(const Decimal128V2& from, UInt32 scale) { |
| auto value = (DecimalV2Value)from; |
| auto str = value.to_string(scale); |
| return str; |
| } |
| |
| template <> |
| inline void CastToString::push_decimal(const Decimal128V2& from, UInt32 scale, BufferWritable& bw) { |
| auto value = (DecimalV2Value)from; |
| std::string str = value.to_string(scale); |
| bw.write(str.data(), str.size()); |
| } |
| |
| template <> |
| inline void CastToString::push_decimal(const DecimalV2Value& from, UInt32 scale, |
| BufferWritable& bw) { |
| std::string str = from.to_string(scale); |
| bw.write(str.data(), str.size()); |
| } |
| |
| // DATEV1 DATETIMEV1 |
| inline std::string CastToString::from_date_or_datetime(const VecDateTimeValue& from) { |
| char buf[64]; |
| char* pos = from.to_string(buf); |
| // DateTime to_string the end is /0 |
| return std::string(buf, pos - 1); |
| } |
| |
| inline void CastToString::push_date_or_datetime(const VecDateTimeValue& from, |
| ColumnString::Chars& chars) { |
| char buf[64]; |
| char* pos = from.to_string(buf); |
| // DateTime to_string the end is /0 |
| chars.insert(buf, pos - 1); |
| } |
| |
| inline void CastToString::push_date_or_datetime(const VecDateTimeValue& from, BufferWritable& bw) { |
| char buf[64]; |
| char* pos = from.to_string(buf); |
| // DateTime to_string the end is /0 |
| bw.write(buf, pos - buf - 1); |
| } |
| |
| // DATEV2 |
| inline std::string CastToString::from_datev2(const DateV2Value<DateV2ValueType>& from) { |
| char buf[64]; |
| char* pos = from.to_string(buf); |
| // DateTime to_string the end is /0 |
| return std::string(buf, pos - 1); |
| } |
| |
| inline void CastToString::push_datev2(const DateV2Value<DateV2ValueType>& from, |
| ColumnString::Chars& chars) { |
| char buf[64]; |
| char* pos = from.to_string(buf); |
| // DateTime to_string the end is /0 |
| chars.insert(buf, pos - 1); |
| } |
| |
| inline void CastToString::push_datev2(const DateV2Value<DateV2ValueType>& from, |
| BufferWritable& bw) { |
| char buf[64]; |
| char* pos = from.to_string(buf); |
| // DateTime to_string the end is /0 |
| bw.write(buf, pos - buf - 1); |
| } |
| |
| // DATETIMEV2 |
| inline std::string CastToString::from_datetimev2(const DateV2Value<DateTimeV2ValueType>& from, |
| UInt32 scale) { |
| char buf[64]; |
| char* pos = from.to_string(buf, scale); |
| // DateTime to_string the end is /0 |
| return std::string(buf, pos - 1); |
| } |
| |
| inline std::string CastToString::from_timestamptz(const TimestampTzValue& from, UInt32 scale, |
| const cctz::time_zone* timezone) { |
| cctz::time_zone tz; |
| if (timezone == nullptr) { |
| tz = cctz::utc_time_zone(); |
| } else { |
| tz = *timezone; |
| } |
| return from.to_string(tz, scale); |
| } |
| inline void CastToString::push_datetimev2(const DateV2Value<DateTimeV2ValueType>& from, |
| UInt32 scale, ColumnString::Chars& chars) { |
| char buf[64]; |
| char* pos = from.to_string(buf, scale); |
| // DateTime to_string the end is /0 |
| chars.insert(buf, pos - 1); |
| } |
| |
| inline void CastToString::push_datetimev2(const DateV2Value<DateTimeV2ValueType>& from, |
| UInt32 scale, BufferWritable& bw) { |
| char buf[64]; |
| char* pos = from.to_string(buf, scale); |
| // DateTime to_string the end is /0 |
| bw.write(buf, pos - buf - 1); |
| } |
| |
| inline void CastToString::push_timestamptz(const TimestampTzValue& from, UInt32 scale, |
| BufferWritable& bw, |
| const DataTypeSerDe::FormatOptions& options) { |
| auto str = from.to_string(*options.timezone, scale); |
| bw.write(str.data(), str.size()); |
| } |
| |
| // IPv4 |
| template <> |
| inline std::string CastToString::from_ip(const IPv4& from) { |
| auto value = IPv4Value(from); |
| return value.to_string(); |
| } |
| |
| template <> |
| inline void CastToString::push_ip(const IPv4& from, BufferWritable& bw) { |
| auto value = IPv4Value(from); |
| std::string str = value.to_string(); |
| bw.write(str.data(), str.size()); |
| } |
| |
| //IPv6 |
| |
| template <> |
| inline std::string CastToString::from_ip(const IPv6& from) { |
| auto value = IPv6Value(from); |
| return value.to_string(); |
| } |
| |
| template <> |
| inline void CastToString::push_ip(const IPv6& from, BufferWritable& bw) { |
| auto value = IPv6Value(from); |
| std::string str = value.to_string(); |
| bw.write(str.data(), str.size()); |
| } |
| |
| // Time |
| inline std::string CastToString::from_time(const TimeValue::TimeType& from, UInt32 scale) { |
| return timev2_to_buffer_from_double(from, scale); |
| } |
| |
| inline void CastToString::push_time(const TimeValue::TimeType& from, UInt32 scale, |
| BufferWritable& bw) { |
| std::string str = timev2_to_buffer_from_double(from, scale); |
| bw.write(str.data(), str.size()); |
| } |
| |
| class CastToStringFunction { |
| public: |
| static Status execute_impl(FunctionContext* context, Block& block, |
| const ColumnNumbers& arguments, uint32_t result, |
| size_t input_rows_count, |
| const NullMap::value_type* null_map = nullptr) { |
| const auto& col_with_type_and_name = block.get_by_position(arguments[0]); |
| const IDataType& type = *col_with_type_and_name.type; |
| const IColumn& col_from = *col_with_type_and_name.column; |
| |
| auto col_to = ColumnString::create(); |
| |
| DataTypeSerDe::FormatOptions options; |
| auto time_zone = cctz::utc_time_zone(); |
| options.timezone = |
| (context && context->state()) ? &context->state()->timezone_obj() : &time_zone; |
| type.get_serde()->to_string_batch(col_from, *col_to, options); |
| |
| block.replace_by_position(result, std::move(col_to)); |
| return Status::OK(); |
| } |
| }; |
| |
| namespace CastWrapper { |
| |
| inline WrapperType create_string_wrapper(const DataTypePtr& from_type) { |
| return [](FunctionContext* context, Block& block, const ColumnNumbers& arguments, |
| uint32_t result, size_t input_rows_count, |
| const NullMap::value_type* null_map = nullptr) { |
| return CastToStringFunction::execute_impl(context, block, arguments, result, |
| input_rows_count, null_map); |
| }; |
| } |
| |
| }; // namespace CastWrapper |
| } // namespace doris |
| #include "common/compile_check_end.h" |