blob: f3e5b43b35d3d9c0c782cc4735ff28e14003b73c [file] [log] [blame]
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
#include <glog/logging.h>
#include <stddef.h>
#include <boost/uuid/random_generator.hpp>
#include <boost/uuid/uuid_io.hpp>
#include <memory>
#include <string>
#include <utility>
#include "common/status.h"
#include "vec/aggregate_functions/aggregate_function.h"
#include "vec/columns/column_string.h"
#include "vec/common/string_utils/string_utils.h"
#include "vec/core/block.h"
#include "vec/core/column_numbers.h"
#include "vec/core/types.h"
#include "vec/data_types/data_type_string.h"
#include "vec/functions/function.h"
#include "vec/functions/function_totype.h"
#include "vec/functions/simple_function_factory.h"
namespace doris {
class FunctionContext;
} // namespace doris
namespace doris::vectorized {
class Uuid : public IFunction {
public:
static constexpr auto name = "uuid";
static constexpr size_t uuid_length = 36; //uuid fixed length
static FunctionPtr create() { return std::make_shared<Uuid>(); }
String get_name() const override { return name; }
bool use_default_implementation_for_constants() const override { return false; }
size_t get_number_of_arguments() const override { return 0; }
bool is_variadic() const override { return false; }
DataTypePtr get_return_type_impl(const DataTypes& arguments) const override {
return std::make_shared<DataTypeString>();
}
Status execute_impl(FunctionContext* context, Block& block, const ColumnNumbers& arguments,
uint32_t result, size_t input_rows_count) const override {
auto col_res = ColumnString::create();
col_res->get_offsets().reserve(input_rows_count);
col_res->get_chars().reserve(input_rows_count * uuid_length);
boost::uuids::random_generator generator;
for (int i = 0; i < input_rows_count; i++) {
std::string uuid = boost::uuids::to_string(generator());
DCHECK(uuid.length() == uuid_length);
col_res->insert_data_without_reserve(uuid.c_str(), uuid.length());
}
block.replace_by_position(result, std::move(col_res));
return Status::OK();
}
};
struct NameIsUuid {
static constexpr auto name = "is_uuid";
};
struct IsUuidImpl {
using ReturnType = DataTypeBool;
using ReturnColumnType = ColumnUInt8;
static constexpr auto PrimitiveTypeImpl = PrimitiveType::TYPE_STRING;
static constexpr size_t uuid_without_dash_length = 32;
static constexpr size_t uuid_with_dash_length = 36;
static constexpr size_t uuid_with_braces_and_dash_length = 38;
static constexpr size_t dash_positions[4] = {8, 13, 18, 23};
static bool is_uuid_with_dash(const char* src, const char* end) {
size_t str_size = end - src;
for (int i = 0; i < str_size; ++i) {
if (!is_hex_ascii(src[i])) {
if (i == dash_positions[0] || i == dash_positions[1] || i == dash_positions[2] ||
i == dash_positions[3]) {
if (src[i] != '-') {
return false;
}
} else {
return false;
}
}
}
return true;
}
static Status vector(const ColumnString::Chars& data, const ColumnString::Offsets& offsets,
PaddedPODArray<UInt8>& res) {
size_t rows_count = offsets.size();
res.resize(rows_count);
for (size_t i = 0; i < rows_count; ++i) {
const char* source = reinterpret_cast<const char*>(&data[offsets[i - 1]]);
int str_size = offsets[i] - offsets[i - 1];
if (str_size == uuid_without_dash_length) {
bool is_valid = true;
for (int j = 0; j < str_size; ++j) {
if (!is_hex_ascii(source[j])) {
is_valid = false;
break;
}
}
res[i] = is_valid;
} else if (str_size == uuid_with_dash_length) {
res[i] = is_uuid_with_dash(source, source + str_size);
} else if (str_size == uuid_with_braces_and_dash_length) {
if (source[0] != '{' || source[str_size - 1] != '}') {
res[i] = 0;
continue;
}
res[i] = is_uuid_with_dash(source + 1, source + str_size - 1);
} else {
res[i] = 0;
}
}
return Status::OK();
}
};
using FunctionIsUuid = FunctionUnaryToType<IsUuidImpl, NameIsUuid>;
void register_function_uuid(SimpleFunctionFactory& factory) {
factory.register_function<Uuid>();
factory.register_function<FunctionIsUuid>();
}
} // namespace doris::vectorized