blob: ebdb0d75e482e37234e4f0c81edb0701fb046030 [file] [log] [blame]
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
#include <gtest/gtest.h>
#include "common/object_pool.h"
#include "exec/exec_node.h"
#include "exprs/expr.h"
#include "exprs/in_predicate.h"
#include "exprs/int_literal.h"
#include "gen_cpp/Exprs_types.h"
#include "runtime/row_batch.h"
#include "runtime/runtime_state.h"
#include "runtime/vectorized_row_batch.h"
#include "util/debug_util.h"
namespace doris {
class InOpTest : public ::testing::Test {
public:
~InOpTest() {}
InOpTest() : _object_pool(NULL), _runtime_state(NULL), _row_desc(NULL) {}
virtual void SetUp() {
_object_pool = new ObjectPool();
_runtime_state = _object_pool->add(new RuntimeState(""));
TDescriptorTable ttbl;
TTupleDescriptor tuple_desc;
tuple_desc.__set_id(0);
tuple_desc.__set_byteSize(8);
tuple_desc.__set_numNullBytes(0);
ttbl.tupleDescriptors.push_back(tuple_desc);
TSlotDescriptor slot_desc;
slot_desc.__set_id(0);
slot_desc.__set_parent(0);
slot_desc.__set_slotType(TPrimitiveType::INT);
slot_desc.__set_columnPos(0);
slot_desc.__set_byteOffset(4);
slot_desc.__set_nullIndicatorByte(0);
slot_desc.__set_nullIndicatorBit(0);
slot_desc.__set_colName("col1");
slot_desc.__set_slotIdx(0);
slot_desc.__set_isMaterialized(true);
ttbl.slotDescriptors.push_back(slot_desc);
DescriptorTbl* desc_tbl = NULL;
ASSERT_TRUE(DescriptorTbl::create(_object_pool, ttbl, &desc_tbl).ok());
ASSERT_TRUE(desc_tbl != NULL);
_runtime_state->set_desc_tbl(desc_tbl);
std::vector<TTupleId> row_tuples;
row_tuples.push_back(0);
std::vector<bool> nullable_tuples;
nullable_tuples.push_back(false);
_row_desc = _object_pool->add(new RowDescriptor(*desc_tbl, row_tuples, nullable_tuples));
}
virtual void TearDown() {
if (_object_pool != NULL) {
delete _object_pool;
_object_pool = NULL;
}
}
Expr* create_expr() {
TExpr exprs;
int num_children = 128;
{
TExprNode expr_node;
expr_node.__set_node_type(TExprNodeType::IN_PRED);
TColumnType type;
type.__set_type(TPrimitiveType::INT);
expr_node.__isset.in_predicate = true;
expr_node.in_predicate.__set_is_not_in(false);
expr_node.__set_type(type);
expr_node.__set_num_children(num_children + 1);
expr_node.__isset.opcode = true;
expr_node.__set_opcode(TExprOpcode::INVALID_OPCODE);
expr_node.__isset.vector_opcode = true;
expr_node.__set_vector_opcode(TExprOpcode::FILTER_IN_INT);
exprs.nodes.push_back(expr_node);
}
{
TExprNode expr_node;
expr_node.__set_node_type(TExprNodeType::SLOT_REF);
TColumnType type;
type.__set_type(TPrimitiveType::INT);
expr_node.__set_type(type);
expr_node.__set_num_children(0);
expr_node.__isset.slot_ref = true;
TSlotRef slot_ref;
slot_ref.__set_slot_id(0);
slot_ref.__set_tuple_id(0);
expr_node.__set_slot_ref(slot_ref);
expr_node.__isset.output_column = true;
expr_node.__set_output_column(0);
exprs.nodes.push_back(expr_node);
}
for (int i = 0; i < num_children; ++i) {
TExprNode expr_node;
expr_node.__set_node_type(TExprNodeType::INT_LITERAL);
TColumnType type;
type.__set_type(TPrimitiveType::INT);
expr_node.__set_type(type);
expr_node.__set_num_children(0);
expr_node.__isset.int_literal = true;
TIntLiteral int_literal;
int_literal.__set_value(i);
expr_node.__set_int_literal(int_literal);
exprs.nodes.push_back(expr_node);
}
Expr* root_expr = NULL;
if (Expr::create_expr_tree(_object_pool, exprs, &root_expr).ok()) {
return root_expr;
} else {
return NULL;
}
}
private:
ObjectPool* _object_pool;
RuntimeState* _runtime_state;
RowDescriptor* _row_desc;
};
TEST_F(InOpTest, PrepareTest) {
Expr* expr = create_expr();
ASSERT_TRUE(expr != NULL);
ASSERT_TRUE(expr->prepare(_runtime_state, *_row_desc).ok());
}
TEST_F(InOpTest, NormalTest) {
Expr* expr = create_expr();
ASSERT_TRUE(expr != NULL);
ASSERT_TRUE(expr->prepare(_runtime_state, *_row_desc).ok());
int capacity = 256;
VectorizedRowBatch* vec_row_batch = _object_pool->add(
new VectorizedRowBatch(*_runtime_state->desc_tbl().get_tuple_descriptor(0), capacity));
MemPool* mem_pool = vec_row_batch->mem_pool();
int32_t* vec_data = reinterpret_cast<int32_t*>(mem_pool->allocate(sizeof(int32_t) * capacity));
vec_row_batch->column(0)->set_col_data(vec_data);
for (int i = 0; i < capacity; ++i) {
vec_data[i] = i;
}
vec_row_batch->set_size(capacity);
expr->evaluate(vec_row_batch);
ASSERT_EQ(vec_row_batch->size(), 128);
Tuple tuple;
int vv = 0;
while (vec_row_batch->get_next_tuple(&tuple)) {
ASSERT_EQ(vv++, *reinterpret_cast<int32_t*>(tuple.get_slot(4)));
}
}
TEST_F(InOpTest, SimplePerformanceTest) {
for (int capacity = 128; capacity <= 1024 * 128; capacity *= 2) {
Expr* expr = create_expr();
ASSERT_TRUE(expr != NULL);
ASSERT_TRUE(expr->prepare(_runtime_state, *_row_desc).ok());
int size = 1024 * 1024 / capacity;
VectorizedRowBatch* vec_row_batches[size];
srand(time(NULL));
for (int i = 0; i < size; ++i) {
vec_row_batches[i] = _object_pool->add(new VectorizedRowBatch(
*_runtime_state->desc_tbl().get_tuple_descriptor(0), capacity));
MemPool* mem_pool = vec_row_batches[i]->mem_pool();
int32_t* vec_data =
reinterpret_cast<int32_t*>(mem_pool->allocate(sizeof(int32_t) * capacity));
vec_row_batches[i]->column(0)->set_col_data(vec_data);
for (int i = 0; i < capacity; ++i) {
vec_data[i] = rand() % 256;
}
vec_row_batches[i]->set_size(capacity);
}
RowBatch* row_batches[size];
for (int i = 0; i < size; ++i) {
row_batches[i] = _object_pool->add(new RowBatch(*_row_desc, capacity));
vec_row_batches[i]->to_row_batch(row_batches[i]);
}
MonotonicStopWatch stopwatch;
stopwatch.start();
for (int i = 0; i < size; ++i) {
expr->evaluate(vec_row_batches[i]);
}
uint64_t vec_time = stopwatch.elapsed_time();
VLOG_CRITICAL << PrettyPrinter::print(vec_time, TCounterType::TIME_NS);
stopwatch.start();
for (int i = 0; i < size; ++i) {
for (int j = 0; j < capacity; ++j) {
ExecNode::eval_conjuncts(&expr, 1, row_batches[i]->get_row(j));
}
}
uint64_t row_time = stopwatch.elapsed_time();
VLOG_CRITICAL << PrettyPrinter::print(row_time, TCounterType::TIME_NS);
VLOG_CRITICAL << "capacity: " << capacity << " multiple: " << row_time / vec_time;
}
}
} // namespace doris
/* vim: set expandtab ts=4 sw=4 sts=4 tw=100: */