blob: 4abf25a99290e24067eea96e36c5c23759adcb82 [file] [log] [blame]
#!/bin/env python
# -*- coding: utf-8 -*-
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
############################################################################
#
# @file test_sys_partition_basic.py
# @date 2015/05/13 15:26:21
# @brief This file is a test file for palo data loading and verifying.
#
#############################################################################
"""
按照所有支持分区的数据类型进行分区建表,对查询结果进行正确性校验
"""
from data import partition as DATA
from lib import palo_config
from lib import palo_client
from lib import util
import random
LOG = palo_client.LOG
L = palo_client.L
config = palo_config.config
broker_info = palo_config.broker_info
def setup_module():
"""
setUp
"""
global client
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
def check_partition_list(table_name, partition_name_list):
"""
验证分区是否创建成功
"""
for partition_name in partition_name_list:
assert client.get_partition(table_name, partition_name)
def check_load_and_verify(table_name, partition_name_list):
"""
验证表是否创建成功,分区是否创建成功,导入数据,校验
"""
data_desc_list = palo_client.LoadDataInfo(DATA.file_path_1, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
assert client.verify(DATA.expected_data_file_list_1, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
assert client.verify(list(DATA.expected_data_file_list_1) * 2, table_name)
def partition_check(table_name, column_name, partition_name_list, \
partition_value_list, distribution_type, bucket_num, storage_type):
"""
检查,验证
"""
partition_info = palo_client.PartitionInfo(column_name, \
partition_name_list, partition_value_list)
distribution_info = palo_client.DistributionInfo(distribution_type, bucket_num)
client.create_table(table_name, DATA.schema_1, \
partition_info, distribution_info)
assert client.show_tables(table_name)
check_partition_list(table_name, partition_name_list)
check_load_and_verify(table_name, partition_name_list)
def test_partition_by_tinyint_random_column_1():
"""
{
"title": "test_sys_partition_basic_a.test_partition_by_tinyint_random_column_1",
"describe": "tinyint分区, 边界值,random, random_bucket_num, column",
"tag": "system,p0,fuzz"
}
"""
"""
tinyint分区, 边界值,random, random_bucket_num, column
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client.clean(database_name)
client.create_database(database_name)
partition_name_list = ['partition_a', 'partition_b', 'partition_c', \
'partition_d', 'partition_e', 'partition_f']
partition_value_list = ['-127', '-1', '0', '1', '126', '127']
random_bucket_num = random.randrange(1, 300)
LOG.info(L('', random_bucket_num=random_bucket_num))
partition_check(table_name, 'k1', \
partition_name_list, partition_value_list, \
'RANDOM', random_bucket_num, 'column')
client.clean(database_name)
def test_partition_by_tinyint_random_hash_1():
"""
{
"title": "test_sys_partition_basic_a.test_partition_by_tinyint_random_hash_1",
"describe": "tinyint分区, 边界值,hash(分区列), random_bucket_num, column",
"tag": "system,p1,fuzz"
}
"""
"""
tinyint分区, 边界值,hash(分区列), random_bucket_num, column
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client.clean(database_name)
client.create_database(database_name)
partition_name_list = ['partition_a', 'partition_b', 'partition_c', \
'partition_d', 'partition_e', 'partition_f']
partition_value_list = ['-127', '-1', '0', '1', '126', '127']
random_bucket_num = random.randrange(1, 300)
LOG.info(L('', random_bucket_num=random_bucket_num))
partition_check(table_name, 'k1', \
partition_name_list, partition_value_list, \
'HASH(k1)', random_bucket_num, 'column')
client.clean(database_name)
def test_partition_by_tinyint_random_hash_2():
"""
{
"title": "test_sys_partition_basic_a.test_partition_by_tinyint_random_hash_2",
"describe": "tinyint分区, 边界值,hash(非分区列), random_bucket_num, column",
"tag": "system,p0,fuzz"
}
"""
"""
tinyint分区, 边界值,hash(非分区列), random_bucket_num, column
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client.clean(database_name)
client.create_database(database_name)
partition_name_list = ['partition_a', 'partition_b', 'partition_c', \
'partition_d', 'partition_e', 'partition_f']
partition_value_list = ['-127', '-1', '0', '1', '126', '127']
random_bucket_num = random.randrange(1, 300)
LOG.info(L('', random_bucket_num=random_bucket_num))
partition_check(table_name, 'k1', \
partition_name_list, partition_value_list, \
'HASH(k2)', random_bucket_num, 'column')
client.clean(database_name)
def test_partition_by_tinyint_random_hash_3():
"""
{
"title": "test_sys_partition_basic_a.test_partition_by_tinyint_random_hash_3",
"describe": "tinyint分区, 边界值,hash(所有非分区列), random_bucket_num, column",
"tag": "system,p0,fuzz"
}
"""
"""
tinyint分区, 边界值,hash(所有非分区列), random_bucket_num, column
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client.clean(database_name)
client.create_database(database_name)
partition_name_list = ['partition_a', 'partition_b', 'partition_c', \
'partition_d', 'partition_e', 'partition_f']
partition_value_list = ['-127', '-1', '0', '1', '126', '127']
random_bucket_num = random.randrange(1, 300)
LOG.info(L('', random_bucket_num=random_bucket_num))
partition_check(table_name, 'k1', \
partition_name_list, partition_value_list, \
'HASH(k2, k3, k4, k5)', random_bucket_num, 'column')
client.clean(database_name)
def test_partition_by_tinyint_random_hash_4():
"""
{
"title": "test_sys_partition_basic_a.test_partition_by_tinyint_random_hash_4",
"describe": "tinyint分区, 边界值,hash(所有列), random_bucket_num, column",
"tag": "system,p0,fuzz"
}
"""
"""
tinyint分区, 边界值,hash(所有列), random_bucket_num, column
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client.clean(database_name)
client.create_database(database_name)
partition_name_list = ['partition_a', 'partition_b', 'partition_c', \
'partition_d', 'partition_e', 'partition_f']
partition_value_list = ['-127', '-1', '0', '1', '126', '127']
random_bucket_num = random.randrange(1, 300)
LOG.info(L('', random_bucket_num=random_bucket_num))
partition_check(table_name, 'k1', \
partition_name_list, partition_value_list, \
'HASH(k1, k2, k3, k4, k5)', random_bucket_num, 'column')
client.clean(database_name)
def test_partition_by_tinyint_random_hash_5():
"""
{
"title": "test_sys_partition_basic_a.test_partition_by_tinyint_random_hash_5",
"describe": " tinyint分区, 边界值,hash(部分非分区列), random_bucket_num, column",
"tag": "system,p1,fuzz"
}
"""
"""
tinyint分区, 边界值,hash(部分非分区列), random_bucket_num, column
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client.clean(database_name)
client.create_database(database_name)
partition_name_list = ['partition_a', 'partition_b', 'partition_c', \
'partition_d', 'partition_e', 'partition_f']
partition_value_list = ['-127', '-1', '0', '1', '126', '127']
random_bucket_num = random.randrange(1, 300)
LOG.info(L('', random_bucket_num=random_bucket_num))
partition_check(table_name, 'k1', \
partition_name_list, partition_value_list, \
'HASH(k3, k4, k5)', random_bucket_num, 'column')
client.clean(database_name)
def test_partition_by_smallint():
"""
{
"title": "test_sys_partition_basic_a.test_partition_by_smallint",
"describe": "smallint分区",
"tag": "system,p1"
}
"""
"""
smallint分区
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client.clean(database_name)
client.create_database(database_name)
partition_name_list = ['partition_a', 'partition_b', 'partition_c', 'partition_d']
partition_value_list = ['10', '20', '30', 'MAXVALUE']
partition_check(table_name, 'k2', partition_name_list, \
partition_value_list, 'RANDOM', 13, 'column')
client.clean(database_name)
def test_partition_by_smallint_over_range():
"""
{
"title": "test_sys_partition_basic_a.test_partition_by_smallint_over_range",
"describe": "smallint分区, 边界值,hash(部分非分区列),乱序,random_bucket_num, column",
"tag": "system,p1,fuzz"
}
"""
"""
smallint分区, 边界值,hash(部分非分区列),乱序,random_bucket_num, column
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client.clean(database_name)
client.create_database(database_name)
partition_name_list = ['partition_a', 'partition_b', 'partition_c', \
'partition_d', 'partition_e', 'partition_f']
partition_value_list = [str(-2 ** 15 + 1), str(-2 ** 15 + 2), \
'0', '1', str(2 ** 15 - 2), str(2 ** 15 - 1)]
random_bucket_num = random.randrange(1, 300)
LOG.info(L('', random_bucket_num=random_bucket_num))
partition_check(table_name, 'k2', \
partition_name_list, partition_value_list, \
'HASH(k4, k5, k1)', random_bucket_num, 'column')
client.clean(database_name)
def test_partition_by_int():
"""
{
"title": "test_sys_partition_basic_a.test_partition_by_int",
"describe": "int分区",
"tag": "system,p1"
}
"""
"""
int分区
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client.clean(database_name)
client.create_database(database_name)
partition_name_list = ['partition_a', 'partition_b', 'partition_c', 'partition_d']
partition_value_list = ['100', '200', '300', 'MAXVALUE']
partition_check(table_name, 'k3', partition_name_list, \
partition_value_list, 'RANDOM', 13, 'column')
client.clean(database_name)
def test_partition_by_int_over_range():
"""
{
"title": "test_sys_partition_basic_a.test_partition_by_int_over_range",
"describe": "int分区, 边界值,hash(部分非分区列),乱序,random_bucket_num, column",
"tag": "system,p1,fuzz"
}
"""
"""
int分区, 边界值,hash(部分非分区列),乱序,random_bucket_num, column
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client.clean(database_name)
client.create_database(database_name)
partition_name_list = ['partition_a', 'partition_b', 'partition_c', \
'partition_d', 'partition_e', 'partition_f']
partition_value_list = [str(-2 ** 31 + 1), str(-2 ** 31 + 2), \
'0', '1', str(2 ** 31 - 2), str(2 ** 31 - 1)]
random_bucket_num = random.randrange(1, 300)
LOG.info(L('', random_bucket_num=random_bucket_num))
partition_check(table_name, 'k3', \
partition_name_list, partition_value_list, \
'HASH(k2, k4, k5, k1)', random_bucket_num, 'column')
client.clean(database_name)
def test_partition_by_bigint():
"""
{
"title": "test_sys_partition_basic_a.test_partition_by_bigint",
"describe": "bigint分区",
"tag": "system,p1"
}
"""
"""
bigint分区
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client.clean(database_name)
client.create_database(database_name)
partition_name_list = ['partition_a', 'partition_b', 'partition_c', 'partition_d']
partition_value_list = ['1000', '2000', '3000', 'MAXVALUE']
partition_check(table_name, 'k4', partition_name_list, \
partition_value_list, 'RANDOM', 13, 'column')
client.clean(database_name)
def test_partition_by_bigint_over_range():
"""
{
"title": "test_sys_partition_basic_a.test_partition_by_bigint_over_range",
"describe": "bigint分区, 边界值,hash(部分非分区列),乱序,random_bucket_num, column",
"tag": "system,p1,fuzz"
}
"""
"""
bigint分区, 边界值,hash(部分非分区列),乱序,random_bucket_num, column
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client.clean(database_name)
client.create_database(database_name)
partition_name_list = ['partition_a', 'partition_b', 'partition_c', \
'partition_d', 'partition_e', 'partition_f']
partition_value_list = [str(-2 ** 63 + 1), str(-2 ** 63 + 2), \
'0', '1', str(2 ** 63 - 2), str(2 ** 63 - 1)]
random_bucket_num = random.randrange(1, 300)
LOG.info(L('', random_bucket_num=random_bucket_num))
partition_check(table_name, 'k4', \
partition_name_list, partition_value_list, \
'HASH(k2, k5, k1)', random_bucket_num, 'column')
client.clean(database_name)
def test_partition_by_bigint_one_partition():
"""
{
"title": "test_sys_partition_basic_a.test_partition_by_bigint_one_partition",
"describe": "bigint分区, 一个分区",
"tag": "system,p1"
}
"""
"""
bigint分区, 一个分区
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client.clean(database_name)
client.create_database(database_name)
partition_name_list = ['partition_a']
partition_value_list = [str(2 ** 63 - 1)]
random_bucket_num = random.randrange(1, 300)
LOG.info(L('', random_bucket_num=random_bucket_num))
partition_check(table_name, 'k4', \
partition_name_list, partition_value_list, \
'HASH(k2, k5, k1)', random_bucket_num, 'column')
client.clean(database_name)
def teardown_module():
"""
tearDown
"""
pass
if __name__ == '__main__':
setup_module()
print(broker_info)
test_partition_by_int()