| // Licensed to the Apache Software Foundation (ASF) under one |
| // or more contributor license agreements. See the NOTICE file |
| // distributed with this work for additional information |
| // regarding copyright ownership. The ASF licenses this file |
| // to you under the Apache License, Version 2.0 (the |
| // "License"); you may not use this file except in compliance |
| // with the License. You may obtain a copy of the License at |
| // |
| // http://www.apache.org/licenses/LICENSE-2.0 |
| // |
| // Unless required by applicable law or agreed to in writing, |
| // software distributed under the License is distributed on an |
| // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| // KIND, either express or implied. See the License for the |
| // specific language governing permissions and limitations |
| // under the License. |
| |
| #include "exprs/binary_predicate.h" |
| |
| #include <gtest/gtest.h> |
| |
| #include "common/object_pool.h" |
| #include "exec/exec_node.h" |
| #include "exprs/expr.h" |
| #include "exprs/int_literal.h" |
| #include "gen_cpp/Exprs_types.h" |
| #include "runtime/row_batch.h" |
| #include "runtime/runtime_state.h" |
| #include "runtime/vectorized_row_batch.h" |
| #include "util/debug_util.h" |
| |
| namespace doris { |
| |
| class BinaryOpTest : public ::testing::Test { |
| public: |
| ~BinaryOpTest() {} |
| |
| virtual void SetUp() { |
| _object_pool = new ObjectPool(); |
| _runtime_state = _object_pool->add(new RuntimeState("")); |
| |
| TDescriptorTable ttbl; |
| TTupleDescriptor tuple_desc; |
| tuple_desc.__set_id(0); |
| tuple_desc.__set_byteSize(8); |
| tuple_desc.__set_numNullBytes(0); |
| ttbl.tupleDescriptors.push_back(tuple_desc); |
| |
| TSlotDescriptor slot_desc; |
| slot_desc.__set_id(0); |
| slot_desc.__set_parent(0); |
| slot_desc.__set_slotType(TPrimitiveType::INT); |
| slot_desc.__set_columnPos(0); |
| slot_desc.__set_byteOffset(4); |
| slot_desc.__set_nullIndicatorByte(0); |
| slot_desc.__set_nullIndicatorBit(0); |
| slot_desc.__set_colName("col1"); |
| slot_desc.__set_slotIdx(0); |
| slot_desc.__set_isMaterialized(true); |
| ttbl.slotDescriptors.push_back(slot_desc); |
| |
| DescriptorTbl* desc_tbl = NULL; |
| ASSERT_TRUE(DescriptorTbl::create(_object_pool, ttbl, &desc_tbl).ok()); |
| ASSERT_TRUE(desc_tbl != NULL); |
| _runtime_state->set_desc_tbl(desc_tbl); |
| |
| std::vector<TTupleId> row_tuples; |
| row_tuples.push_back(0); |
| std::vector<bool> nullable_tuples; |
| nullable_tuples.push_back(false); |
| _row_desc = _object_pool->add(new RowDescriptor(*desc_tbl, row_tuples, nullable_tuples)); |
| |
| FieldInfo field; |
| field.name = "col1"; |
| field.type = OLAP_FIELD_TYPE_INT; |
| field.length = 4; |
| field.is_key = true; |
| _schema.push_back(field); |
| } |
| virtual void TearDown() { |
| if (_object_pool != NULL) { |
| delete _object_pool; |
| _object_pool = NULL; |
| } |
| } |
| |
| Expr* create_expr() { |
| TExpr exprs; |
| { |
| TExprNode expr_node; |
| expr_node.__set_node_type(TExprNodeType::BINARY_PRED); |
| TColumnType type; |
| type.__set_type(TPrimitiveType::INT); |
| expr_node.__set_type(type); |
| expr_node.__set_num_children(2); |
| expr_node.__isset.opcode = true; |
| expr_node.__set_opcode(TExprOpcode::LT_INT_INT); |
| expr_node.__isset.vector_opcode = true; |
| expr_node.__set_vector_opcode(TExprOpcode::FILTER_LT_INT_INT); |
| exprs.nodes.push_back(expr_node); |
| } |
| { |
| TExprNode expr_node; |
| expr_node.__set_node_type(TExprNodeType::SLOT_REF); |
| TColumnType type; |
| type.__set_type(TPrimitiveType::INT); |
| expr_node.__set_type(type); |
| expr_node.__set_num_children(0); |
| expr_node.__isset.slot_ref = true; |
| TSlotRef slot_ref; |
| slot_ref.__set_slot_id(0); |
| slot_ref.__set_tuple_id(0); |
| expr_node.__set_slot_ref(slot_ref); |
| expr_node.__isset.output_column = true; |
| expr_node.__set_output_column(0); |
| exprs.nodes.push_back(expr_node); |
| } |
| { |
| TExprNode expr_node; |
| expr_node.__set_node_type(TExprNodeType::INT_LITERAL); |
| TColumnType type; |
| type.__set_type(TPrimitiveType::INT); |
| expr_node.__set_type(type); |
| expr_node.__set_num_children(0); |
| expr_node.__isset.int_literal = true; |
| TIntLiteral int_literal; |
| int_literal.__set_value(10); |
| expr_node.__set_int_literal(int_literal); |
| exprs.nodes.push_back(expr_node); |
| } |
| Expr* root_expr = NULL; |
| |
| if (Expr::create_expr_tree(_object_pool, exprs, &root_expr).ok()) { |
| return root_expr; |
| } else { |
| return NULL; |
| } |
| } |
| |
| public: |
| ObjectPool* object_pool() { return _object_pool; } |
| RuntimeState* runtime_state() { return _runtime_state; } |
| RowDescriptor* row_desc() { return _row_desc; } |
| |
| private: |
| ObjectPool* _object_pool; |
| RuntimeState* _runtime_state; |
| RowDescriptor* _row_desc; |
| std::vector<FieldInfo> _schema; |
| }; |
| |
| TEST_F(BinaryOpTest, PrepareTest) { |
| Expr* expr = create_expr(); |
| ASSERT_TRUE(expr != NULL); |
| ASSERT_TRUE(expr->prepare(runtime_state(), *row_desc()).ok()); |
| } |
| |
| TEST_F(BinaryOpTest, NormalTest) { |
| Expr* expr = create_expr(); |
| ASSERT_TRUE(expr != NULL); |
| ASSERT_TRUE(expr->prepare(runtime_state(), *row_desc()).ok()); |
| int capacity = 256; |
| VectorizedRowBatch* vec_row_batch = |
| object_pool()->add(new VectorizedRowBatch(_schema, capacity)); |
| MemPool* mem_pool = vec_row_batch->mem_pool(); |
| int32_t* vec_data = reinterpret_cast<int32_t*>(mem_pool->allocate(sizeof(int32_t) * capacity)); |
| vec_row_batch->column(0)->set_col_data(vec_data); |
| |
| for (int i = 0; i < capacity; ++i) { |
| vec_data[i] = i; |
| } |
| |
| vec_row_batch->set_size(capacity); |
| expr->evaluate(vec_row_batch); |
| ASSERT_EQ(vec_row_batch->size(), 10); |
| |
| Tuple tuple; |
| int vv = 0; |
| |
| while (vec_row_batch->get_next_tuple(&tuple, |
| *runtime_state()->desc_tbl().get_tuple_descriptor(0))) { |
| ASSERT_EQ(vv++, *reinterpret_cast<int32_t*>(tuple.get_slot(4))); |
| } |
| } |
| |
| TEST_F(BinaryOpTest, SimplePerformanceTest) { |
| ASSERT_EQ(1, _row_desc->tuple_descriptors().size()); |
| for (int capacity = 128; capacity <= 1024 * 128; capacity *= 2) { |
| Expr* expr = create_expr(); |
| ASSERT_TRUE(expr != NULL); |
| ASSERT_TRUE(expr->prepare(runtime_state(), *row_desc()).ok()); |
| int size = 1024 * 1024 / capacity; |
| VectorizedRowBatch* vec_row_batches[size]; |
| srand(time(NULL)); |
| |
| for (int i = 0; i < size; ++i) { |
| vec_row_batches[i] = object_pool()->add(new VectorizedRowBatch(_schema, capacity)); |
| MemPool* mem_pool = vec_row_batches[i]->mem_pool(); |
| int32_t* vec_data = |
| reinterpret_cast<int32_t*>(mem_pool->allocate(sizeof(int32_t) * capacity)); |
| vec_row_batches[i]->column(0)->set_col_data(vec_data); |
| |
| for (int i = 0; i < capacity; ++i) { |
| vec_data[i] = rand() % 20; |
| } |
| |
| vec_row_batches[i]->set_size(capacity); |
| } |
| |
| RowBatch* row_batches[size]; |
| |
| for (int i = 0; i < size; ++i) { |
| row_batches[i] = object_pool()->add(new RowBatch(*row_desc(), capacity)); |
| vec_row_batches[i]->to_row_batch(row_batches[i], |
| *runtime_state()->desc_tbl().get_tuple_descriptor(0)); |
| } |
| |
| MonotonicStopWatch stopwatch; |
| stopwatch.start(); |
| |
| for (int i = 0; i < size; ++i) { |
| expr->evaluate(vec_row_batches[i]); |
| } |
| |
| uint64_t vec_time = stopwatch.elapsed_time(); |
| VLOG_CRITICAL << PrettyPrinter::print(vec_time, TCounterType::TIME_NS); |
| |
| stopwatch.start(); |
| |
| for (int i = 0; i < size; ++i) { |
| for (int j = 0; j < capacity; ++j) { |
| ExecNode::eval_conjuncts(&expr, 1, row_batches[i]->get_row(j)); |
| } |
| } |
| |
| uint64_t row_time = stopwatch.elapsed_time(); |
| VLOG_CRITICAL << PrettyPrinter::print(row_time, TCounterType::TIME_NS); |
| |
| VLOG_CRITICAL << "capacity: " << capacity << " multiple: " << row_time / vec_time; |
| } |
| } |
| |
| } // namespace doris |
| |
| /* vim: set expandtab ts=4 sw=4 sts=4 tw=100: */ |