blob: 867c71137adb1e05f665d230994736ea337328e0 [file] [log] [blame]
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
#include "olap/rowset/rowset_converter.h"
#include <fstream>
#include <sstream>
#include <string>
#include "boost/filesystem.hpp"
#include "gmock/gmock.h"
#include "gtest/gtest.h"
#include "json2pb/json_to_pb.h"
#include "olap/data_dir.h"
#include "olap/olap_cond.h"
#include "olap/olap_meta.h"
#include "olap/rowset/rowset_factory.h"
#include "olap/rowset/rowset_reader.h"
#include "olap/rowset/rowset_reader_context.h"
#include "olap/rowset/rowset_writer.h"
#include "olap/rowset/rowset_writer_context.h"
#include "olap/storage_engine.h"
#include "olap/tablet_meta.h"
#include "runtime/exec_env.h"
#include "util/file_utils.h"
#include "util/logging.h"
#ifndef BE_TEST
#define BE_TEST
#endif
using ::testing::_;
using ::testing::Return;
using ::testing::SetArgPointee;
using std::string;
namespace doris {
// Size of the stack buffer that receives the current working directory in SetUp().
static constexpr uint32_t MAX_PATH_LEN{1024};
// Storage engine shared by all test cases; SetUp() opens it only while this is still null.
StorageEngine* k_engine{nullptr};
// Fills `rowset_writer_context` with the fixed identifiers this test file uses everywhere:
// rowset id 10000, tablet 12345, schema hash 1111, partition 10, version [0, 1].
//
// tablet_schema          - assigned to the context's `tablet_schema` field.
// dst_type               - rowset format the writer built from this context should produce.
// rowset_writer_context  - output; must not be null.
void create_rowset_writer_context(TabletSchema* tablet_schema, RowsetTypePB dst_type,
                                  RowsetWriterContext* rowset_writer_context) {
    RowsetWriterContext& ctx = *rowset_writer_context;

    // Rowset identity and format.
    RowsetId id;
    id.init(10000);
    ctx.rowset_id = id;
    ctx.rowset_type = dst_type;
    ctx.rowset_state = VISIBLE;

    // Owning tablet; the path suffix mirrors <shard>/<tablet_id>/<schema_hash>.
    ctx.tablet_id = 12345;
    ctx.tablet_schema_hash = 1111;
    ctx.partition_id = 10;
    ctx.tablet_schema = tablet_schema;
    ctx.rowset_path_prefix = config::storage_root_path + "/data/0/12345/1111";

    // Version range covered by the rowset.
    ctx.version.first = 0;
    ctx.version.second = 1;
    ctx.version_hash = 110;
}
// Fills `rowset_reader_context` for an ordered READER_ALTER_TABLE read with no key-range
// bounds. All pointer arguments are assigned to the context as-is; `return_columns` is used
// for both the returned and the seek column lists.
void create_rowset_reader_context(TabletSchema* tablet_schema,
                                  const std::vector<uint32_t>* return_columns,
                                  const DeleteHandler* delete_handler,
                                  std::vector<ColumnPredicate*>* predicates,
                                  std::set<uint32_t>* load_bf_columns, Conditions* conditions,
                                  RowsetReaderContext* rowset_reader_context) {
    RowsetReaderContext& ctx = *rowset_reader_context;

    // Read mode.
    ctx.reader_type = READER_ALTER_TABLE;
    ctx.need_ordered_result = true;

    // Schema and column selection.
    ctx.tablet_schema = tablet_schema;
    ctx.return_columns = return_columns;
    ctx.seek_columns = return_columns;

    // Filtering inputs supplied by the caller.
    ctx.delete_handler = delete_handler;
    ctx.predicates = predicates;
    ctx.load_bf_columns = load_bf_columns;
    ctx.conditions = conditions;

    // No lower/upper key bounds are set.
    ctx.lower_bound_keys = nullptr;
    ctx.is_lower_keys_included = nullptr;
    ctx.upper_bound_keys = nullptr;
    ctx.is_upper_keys_included = nullptr;
}
// Builds a three-column schema and loads it into `tablet_schema`:
//   k1  INT      key    (length 4,  index length 4)
//   k2  VARCHAR  key    (length 20, index length 20)
//   v1  INT      value  (length 4,  aggregation "SUM")
// All columns are non-nullable and have no bloom filter. `keys_type` is stored unchanged.
void create_tablet_schema(KeysType keys_type, TabletSchema* tablet_schema) {
    TabletSchemaPB schema_pb;
    schema_pb.set_keys_type(keys_type);
    schema_pb.set_num_short_key_columns(2);
    schema_pb.set_num_rows_per_row_block(1024);
    schema_pb.set_compress_kind(COMPRESS_NONE);
    schema_pb.set_next_column_unique_id(4);

    // Appends a column with the attributes shared by every column in this schema and
    // returns it so the caller can set the key-only / value-only fields.
    auto append_column = [&schema_pb](int32_t unique_id, const char* name, const char* type,
                                      int32_t length, bool is_key) {
        ColumnPB* column = schema_pb.add_column();
        column->set_unique_id(unique_id);
        column->set_name(name);
        column->set_type(type);
        column->set_length(length);
        column->set_is_key(is_key);
        column->set_is_nullable(false);
        column->set_is_bf_column(false);
        return column;
    };

    ColumnPB* key_int = append_column(1, "k1", "INT", 4, true);
    key_int->set_index_length(4);

    ColumnPB* key_varchar = append_column(2, "k2", "VARCHAR", 20, true);
    key_varchar->set_index_length(20);

    ColumnPB* value_int = append_column(3, "v1", "INT", 4, false);
    value_int->set_aggregation("SUM");

    tablet_schema->init_from_pb(schema_pb);
}
// Builds a TabletMetaPB for tablet 12345 (table 10000, schema hash 1111, partition 10,
// shard 0, state PB_RUNNING), embeds `tablet_schema` serialized via to_schema_pb(), and
// loads the result into `tablet_meta`.
void create_tablet_meta(TabletSchema* tablet_schema, TabletMeta* tablet_meta) {
    TabletMetaPB meta_pb;

    // Identifiers; these match the values used by create_rowset_writer_context().
    meta_pb.set_table_id(10000);
    meta_pb.set_partition_id(10);
    meta_pb.set_tablet_id(12345);
    meta_pb.set_schema_hash(1111);
    meta_pb.set_shard_id(0);

    meta_pb.set_creation_time(1575020449);
    meta_pb.set_tablet_state(PB_RUNNING);

    PUniqueId* uid = meta_pb.mutable_tablet_uid();
    uid->set_hi(10);
    uid->set_lo(10);

    // Serialize the in-memory schema straight into the meta's schema sub-message.
    tablet_schema->to_schema_pb(meta_pb.mutable_schema());

    tablet_meta->init_from_pb(meta_pb);
}
class RowsetConverterTest : public testing::Test {
public:
virtual void SetUp() {
config::tablet_map_shard_size = 1;
config::txn_map_shard_size = 1;
config::txn_shard_size = 1;
config::path_gc_check = false;
char buffer[MAX_PATH_LEN];
getcwd(buffer, MAX_PATH_LEN);
config::storage_root_path = std::string(buffer) + "/data_test";
FileUtils::remove_all(config::storage_root_path);
ASSERT_TRUE(FileUtils::create_dir(config::storage_root_path).ok());
std::vector<StorePath> paths;
paths.emplace_back(config::storage_root_path, -1);
doris::EngineOptions options;
options.store_paths = paths;
if (k_engine == nullptr) {
Status s = doris::StorageEngine::open(options, &k_engine);
ASSERT_TRUE(s.ok()) << s.to_string();
}
ExecEnv* exec_env = doris::ExecEnv::GetInstance();
exec_env->set_storage_engine(k_engine);
std::string data_path = config::storage_root_path + "/data";
ASSERT_TRUE(FileUtils::create_dir(data_path).ok());
std::string shard_path = data_path + "/0";
ASSERT_TRUE(FileUtils::create_dir(shard_path).ok());
std::string tablet_path = shard_path + "/12345";
ASSERT_TRUE(FileUtils::create_dir(tablet_path).ok());
_schema_hash_path = tablet_path + "/1111";
ASSERT_TRUE(FileUtils::create_dir(_schema_hash_path).ok());
_mem_tracker.reset(new MemTracker(-1));
_mem_pool.reset(new MemPool(_mem_tracker.get()));
}
virtual void TearDown() { FileUtils::remove_all(config::storage_root_path); }
void process(RowsetTypePB src_type, RowsetTypePB dst_type);
private:
std::string _schema_hash_path;
std::shared_ptr<MemTracker> _mem_tracker;
std::unique_ptr<MemPool> _mem_pool;
};
// Round-trips 1024 rows through RowsetConverter:
//   1. writes them into a rowset of format `src_type`;
//   2. converts that rowset (convert_alpha_to_beta when `dst_type` is BETA_ROWSET,
//      convert_beta_to_alpha otherwise);
//   3. opens the converted rowset and checks every row.
// Row i holds k1 = i, k2 = "well<i>", v1 = 10000 + i.
// Every status returned along the way is asserted, so a failure stops the test at its source.
void RowsetConverterTest::process(RowsetTypePB src_type, RowsetTypePB dst_type) {
    const int kNumRows = 1024;

    // write
    TabletSchema tablet_schema;
    create_tablet_schema(AGG_KEYS, &tablet_schema);
    RowsetWriterContext rowset_writer_context;
    create_rowset_writer_context(&tablet_schema, src_type, &rowset_writer_context);
    std::unique_ptr<RowsetWriter> rowset_writer;
    ASSERT_EQ(OLAP_SUCCESS,
              RowsetFactory::create_rowset_writer(rowset_writer_context, &rowset_writer));
    RowCursor row;
    OLAPStatus res = row.init(tablet_schema);
    ASSERT_EQ(OLAP_SUCCESS, res);

    std::vector<std::string> test_data;
    // Reserve up front so the strings referenced by the Slices below are never relocated
    // by a vector reallocation.
    test_data.reserve(kNumRows);
    for (int i = 0; i < kNumRows; ++i) {
        test_data.push_back("well" + std::to_string(i));
        int32_t field_0 = i;
        row.set_field_content(0, reinterpret_cast<char*>(&field_0), _mem_pool.get());
        Slice field_1(test_data[i]);
        row.set_field_content(1, reinterpret_cast<char*>(&field_1), _mem_pool.get());
        int32_t field_2 = 10000 + i;
        row.set_field_content(2, reinterpret_cast<char*>(&field_2), _mem_pool.get());
        ASSERT_EQ(OLAP_SUCCESS, rowset_writer->add_row(row));
    }
    ASSERT_EQ(OLAP_SUCCESS, rowset_writer->flush());
    RowsetSharedPtr src_rowset = rowset_writer->build();
    ASSERT_TRUE(src_rowset != nullptr);
    RowsetId src_rowset_id;
    src_rowset_id.init(10000);
    ASSERT_EQ(src_rowset_id, src_rowset->rowset_id());
    ASSERT_EQ(kNumRows, src_rowset->num_rows());

    // convert
    TabletMetaSharedPtr tablet_meta(new TabletMeta());
    create_tablet_meta(&tablet_schema, tablet_meta.get());
    RowsetConverter rowset_converter(tablet_meta);
    RowsetMetaPB dst_rowset_meta_pb;
    if (dst_type == BETA_ROWSET) {
        ASSERT_EQ(OLAP_SUCCESS,
                  rowset_converter.convert_alpha_to_beta(src_rowset->rowset_meta(),
                                                         _schema_hash_path, &dst_rowset_meta_pb));
    } else {
        ASSERT_EQ(OLAP_SUCCESS,
                  rowset_converter.convert_beta_to_alpha(src_rowset->rowset_meta(),
                                                         _schema_hash_path, &dst_rowset_meta_pb));
    }
    ASSERT_EQ(dst_type, dst_rowset_meta_pb.rowset_type());
    ASSERT_EQ(12345, dst_rowset_meta_pb.tablet_id());
    ASSERT_EQ(kNumRows, dst_rowset_meta_pb.num_rows());

    // read
    RowsetMetaSharedPtr dst_rowset_meta(new RowsetMeta());
    ASSERT_TRUE(dst_rowset_meta->init_from_pb(dst_rowset_meta_pb));
    RowsetSharedPtr dst_rowset;
    ASSERT_EQ(OLAP_SUCCESS, RowsetFactory::create_rowset(&tablet_schema, _schema_hash_path,
                                                         dst_rowset_meta, &dst_rowset));
    RowsetReaderSharedPtr dst_rowset_reader;
    ASSERT_EQ(OLAP_SUCCESS, dst_rowset->create_reader(&dst_rowset_reader));

    RowsetReaderContext rowset_reader_context;
    std::set<uint32_t> load_bf_columns;
    std::vector<ColumnPredicate*> predicates;
    Conditions conditions;
    // Request every column of the schema, in schema order.
    std::vector<uint32_t> return_columns;
    for (uint32_t i = 0; i < tablet_schema.num_columns(); ++i) {
        return_columns.push_back(i);
    }
    DeleteHandler delete_handler;
    create_rowset_reader_context(&tablet_schema, &return_columns, &delete_handler, &predicates,
                                 &load_bf_columns, &conditions, &rowset_reader_context);
    res = dst_rowset_reader->init(&rowset_reader_context);
    ASSERT_EQ(OLAP_SUCCESS, res);

    RowBlock* row_block = nullptr;
    res = dst_rowset_reader->next_block(&row_block);
    ASSERT_EQ(OLAP_SUCCESS, res);
    // Guard the dereferences below.
    ASSERT_TRUE(row_block != nullptr);
    ASSERT_EQ(kNumRows, row_block->remaining());

    RowCursor row_cursor;
    ASSERT_EQ(OLAP_SUCCESS, row_cursor.init(tablet_schema));
    for (int i = 0; i < kNumRows; ++i) {
        row_block->get_row(i, &row_cursor);
        // k1 and v1 are INT columns written from int32_t values, so read them back as
        // int32_t to keep the comparison signed on both sides.
        ASSERT_EQ(i, *reinterpret_cast<const int32_t*>(row_cursor.cell_ptr(0)));
        ASSERT_EQ("well" + std::to_string(i),
                  reinterpret_cast<const Slice*>(row_cursor.cell_ptr(1))->to_string());
        ASSERT_EQ(10000 + i, *reinterpret_cast<const int32_t*>(row_cursor.cell_ptr(2)));
    }
}
// Writes an alpha rowset, converts it to beta, and verifies the converted rows.
TEST_F(RowsetConverterTest, TestConvertAlphaRowsetToBeta) {
    const RowsetTypePB source_format = ALPHA_ROWSET;
    const RowsetTypePB target_format = BETA_ROWSET;
    process(source_format, target_format);
}
// Writes a beta rowset, converts it to alpha, and verifies the converted rows.
// The source must be BETA_ROWSET and the destination ALPHA_ROWSET: process() selects
// convert_beta_to_alpha only when the destination type is not BETA_ROWSET, so passing
// (ALPHA_ROWSET, BETA_ROWSET) here would merely repeat the alpha-to-beta test.
TEST_F(RowsetConverterTest, TestConvertBetaRowsetToAlpha) {
    process(BETA_ROWSET, ALPHA_ROWSET);
}
} // namespace doris
// Test entry point. Creates the global storage page cache (arguments 1 << 30 and 0.1)
// before GoogleTest is initialized, then runs every registered test and returns
// GoogleTest's result as the process exit code.
int main(int argc, char** argv) {
    doris::StoragePageCache::create_global_cache(1 << 30, 0.1);

    ::testing::InitGoogleTest(&argc, argv);
    const int exit_code = RUN_ALL_TESTS();
    return exit_code;
}