| // Licensed to the Apache Software Foundation (ASF) under one |
| // or more contributor license agreements. See the NOTICE file |
| // distributed with this work for additional information |
| // regarding copyright ownership. The ASF licenses this file |
| // to you under the Apache License, Version 2.0 (the |
| // "License"); you may not use this file except in compliance |
| // with the License. You may obtain a copy of the License at |
| // |
| // http://www.apache.org/licenses/LICENSE-2.0 |
| // |
| // Unless required by applicable law or agreed to in writing, |
| // software distributed under the License is distributed on an |
| // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| // KIND, either express or implied. See the License for the |
| // specific language governing permissions and limitations |
| // under the License. |
| |
| #pragma once |
| |
| #include <variant> |
| #include <vector> |
| |
| #include "vec/common/hash_table/hash_map_util.h" |
| |
| namespace doris { |
| |
| struct RowRefWithFlag { |
| bool visited; |
| uint32_t row_num = 0; |
| RowRefWithFlag() = default; |
| #include "common/compile_check_avoid_begin.h" |
| //To consider performance, checks are avoided here. |
| RowRefWithFlag(size_t row_num_count, bool is_visited = false) |
| : visited(is_visited), row_num(row_num_count) {} |
| #include "common/compile_check_avoid_end.h" |
| }; |
| |
| template <typename T> |
| using SetData = PHHashMap<T, RowRefWithFlag, HashCRC32<T>>; |
| |
| template <typename T> |
| using SetFixedKeyHashTableContext = vectorized::MethodKeysFixed<SetData<T>>; |
| |
| template <typename T> |
| using SetPrimaryTypeHashTableContext = vectorized::MethodOneNumber<T, SetData<T>>; |
| |
| template <typename T> |
| using SetPrimaryTypeHashTableContextNullable = vectorized::MethodSingleNullableColumn< |
| vectorized::MethodOneNumber<T, vectorized::DataWithNullKey<SetData<T>>>>; |
| |
| using SetSerializedHashTableContext = |
| vectorized::MethodSerialized<PHHashMap<StringRef, RowRefWithFlag>>; |
| using SetMethodOneString = vectorized::MethodStringNoCache<PHHashMap<StringRef, RowRefWithFlag>>; |
| |
| using SetHashTableVariants = |
| std::variant<std::monostate, SetSerializedHashTableContext, SetMethodOneString, |
| SetPrimaryTypeHashTableContextNullable<vectorized::UInt8>, |
| SetPrimaryTypeHashTableContextNullable<vectorized::UInt16>, |
| SetPrimaryTypeHashTableContextNullable<vectorized::UInt32>, |
| SetPrimaryTypeHashTableContextNullable<vectorized::UInt64>, |
| SetPrimaryTypeHashTableContextNullable<vectorized::UInt128>, |
| SetPrimaryTypeHashTableContextNullable<vectorized::UInt256>, |
| SetPrimaryTypeHashTableContext<vectorized::UInt8>, |
| SetPrimaryTypeHashTableContext<vectorized::UInt16>, |
| SetPrimaryTypeHashTableContext<vectorized::UInt32>, |
| SetPrimaryTypeHashTableContext<vectorized::UInt64>, |
| SetPrimaryTypeHashTableContext<vectorized::UInt128>, |
| SetPrimaryTypeHashTableContext<vectorized::UInt256>, |
| SetFixedKeyHashTableContext<vectorized::UInt64>, |
| SetFixedKeyHashTableContext<vectorized::UInt128>, |
| SetFixedKeyHashTableContext<vectorized::UInt256>, |
| SetFixedKeyHashTableContext<vectorized::UInt136>>; |
| |
| struct SetDataVariants |
| : public DataVariants<SetHashTableVariants, vectorized::MethodSingleNullableColumn, |
| vectorized::MethodOneNumber, vectorized::DataWithNullKey> { |
| void init(const std::vector<vectorized::DataTypePtr>& data_types, HashKeyType type) { |
| bool nullable = data_types.size() == 1 && data_types[0]->is_nullable(); |
| switch (type) { |
| case HashKeyType::serialized: |
| method_variant.emplace<SetSerializedHashTableContext>(); |
| break; |
| case HashKeyType::int8_key: |
| emplace_single<vectorized::UInt8, SetData<vectorized::UInt8>>(nullable); |
| break; |
| case HashKeyType::int16_key: |
| emplace_single<vectorized::UInt16, SetData<vectorized::UInt16>>(nullable); |
| break; |
| case HashKeyType::int32_key: |
| emplace_single<vectorized::UInt32, SetData<vectorized::UInt32>>(nullable); |
| break; |
| case HashKeyType::int64_key: |
| emplace_single<vectorized::UInt64, SetData<vectorized::UInt64>>(nullable); |
| break; |
| case HashKeyType::int128_key: |
| emplace_single<vectorized::UInt128, SetData<vectorized::UInt128>>(nullable); |
| break; |
| case HashKeyType::int256_key: |
| emplace_single<vectorized::UInt256, SetData<vectorized::UInt256>>(nullable); |
| break; |
| case HashKeyType::string_key: |
| method_variant.emplace<SetMethodOneString>(); |
| break; |
| case HashKeyType::fixed64: |
| method_variant.emplace<SetFixedKeyHashTableContext<vectorized::UInt64>>( |
| get_key_sizes(data_types)); |
| break; |
| case HashKeyType::fixed128: |
| method_variant.emplace<SetFixedKeyHashTableContext<vectorized::UInt128>>( |
| get_key_sizes(data_types)); |
| break; |
| case HashKeyType::fixed136: |
| method_variant.emplace<SetFixedKeyHashTableContext<vectorized::UInt136>>( |
| get_key_sizes(data_types)); |
| break; |
| case HashKeyType::fixed256: |
| method_variant.emplace<SetFixedKeyHashTableContext<vectorized::UInt256>>( |
| get_key_sizes(data_types)); |
| break; |
| default: |
| throw Exception(ErrorCode::INTERNAL_ERROR, |
| "SetDataVariants meet invalid key type, type={}", type); |
| } |
| } |
| }; |
| |
| } // namespace doris |