blob: 189ab8617faf85e2320741356883de86b5acb3c2 [file] [log] [blame]
#!/bin/env python
# -*- coding: utf-8 -*-
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
"""
/***************************************************************************
*
* @file test_sys_null.py
* @date 2016/04/01 15:26:21
* @brief Test for function - "NULL".
*
**************************************************************************/
"""
import pytest
from data import support_null as DATA
from lib import palo_client
from lib import util
from lib import palo_config
from lib import common
config = palo_config.config
LOG = palo_client.LOG
L = palo_client.L
broker_info = palo_config.broker_info
def setup_module():
"""
setUp
"""
pass
def test_shortkey_null_a():
"""
{
"title": "test_sys_null.test_shortkey_null_a",
"describe": "shortkey列为NULL",
"tag": "system,p1"
}
"""
"""
shortkey列为NULL
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name,
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.use(database_name)
client.clean(database_name)
client.create_database(database_name)
client.create_table(table_name, DATA.schema_1, storage_type='column', set_null=True)
assert client.show_tables(table_name)
assert client.get_index(table_name)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_1, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
sql = 'SELECT * FROM %s.%s ORDER BY k1 nulls last, k2 nulls last, k3, k4, k5' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_list_data_1, sql=sql, client=client)
client.clean(database_name)
def test_shortkey_null_b():
"""
{
"title": "test_sys_null.test_shortkey_null_b",
"describe": "shortkey列为not NULL",
"tag": "system,p1,fuzz"
}
"""
"""
shortkey列为not NULL
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name,
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
client.create_table(table_name, DATA.schema_1, storage_type='column')
assert client.show_tables(table_name)
assert client.get_index(table_name)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_2, table_name)
assert not client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
client.clean(database_name)
@pytest.mark.skip()
def test_null_kv():
"""
{
"title": "test_sys_null.test_null_kv",
"describe": "定长类型和变长类型共12种数据类型为key和value时,指定为NULL列,导入含有NULL值的数据,验证数据正确性",
"tag": "autotest"
}
"""
"""
定长类型和变长类型共12种数据类型为key和value时,指定为NULL列,导入含有NULL值的数据,验证数据正确性
"""
# not null列, 非Null数据导入,校验
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
client.create_table(table_name, DATA.schema_2, storage_type='column', )
assert client.show_tables(table_name)
assert client.get_index(table_name)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_3, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
sql = 'SELECT * FROM %s.%s ORDER BY k1' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_list_data_2, sql=sql, client=client)
client.clean(database_name)
def test_order_by():
"""
{
"title": "test_sys_null.test_order_by",
"describe": "测试排序",
"tag": "system,p1"
}
"""
"""
测试排序
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
client.create_table(table_name, DATA.schema_2, storage_type='column', set_null=True)
assert client.show_tables(table_name)
assert client.get_index(table_name)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_4, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
sql = 'SELECT * FROM %s.%s ORDER BY k2 nulls last, k1 nulls last' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_4, sql=sql, client=client)
client.clean(database_name)
def test_null_all():
"""
{
"title": "test_sys_null.test_null_all",
"describe": "一行数据中,多个连续key和value列为NULL值,所有key列为NULL,验证聚合正确,验证数据正确,导入多条数据,这些数据的key列部分相同且含有NULL,验证导入后的聚合结果是否正确",
"tag": "system,p1"
}
"""
"""
一行数据中,多个连续key和value列为NULL值
所有key列为NULL,验证聚合正确,验证数据正确
导入多条数据,这些数据的key列部分相同且含有NULL,验证导入后的聚合结果是否正确
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
client.create_table(table_name, DATA.schema_2, storage_type='column', set_null=True)
assert client.show_tables(table_name)
assert client.get_index(table_name)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_5, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
sql = 'SELECT * FROM %s.%s ' \
'ORDER BY k2 nulls last, k1, k3, k4, k5, k6, k7, k8, k9, k10' \
% (database_name, table_name)
assert common.check_by_file(DATA.expected_file_5, sql=sql, client=client)
sql = 'SELECT * FROM %s.%s WHERE K5 is NULL' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_5_1, sql=sql, client=client)
client.clean(database_name)
@pytest.mark.skip()
def test_empty_string():
"""
{
"title": "test_sys_null.test_empty_string",
"describe": "导入empty field代表空字符串,验证数据正确,空串的replace类型,聚合结果不符合预期",
"tag": "autotest"
}
"""
"""
导入empty field代表空字符串,验证数据正确
空串的replace类型,聚合结果不符合预期
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
client.create_table(table_name, DATA.schema_2, storage_type='column', set_null=True)
assert client.show_tables(table_name)
assert client.get_index(table_name)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_6, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
sql = 'SELECT * FROM %s.%s ' \
'ORDER BY k2, k1, k3, k4, k5, k6, k7, k8, k9, k10' \
% (database_name, table_name)
assert common.check_by_file(DATA.expected_file_6, sql=sql, client=client)
def test_partition_col_null_hash():
"""
{
"title": "test_sys_null.test_partition_col_null_hash",
"describe": "partition列为NULL,分布方式为hash,hash列为NULL",
"tag": "system,p1"
}
"""
"""
partition列为NULL,分布方式为hash
hash列为NULL
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
partition_name_list = ['partition_a', 'partition_b', 'partition_c', 'partition_d']
partition_value_list = ['-5000', '0', '3000', 'MAXVALUE']
partition_info = palo_client.PartitionInfo('k5', \
partition_name_list, partition_value_list)
distribution_info = palo_client.DistributionInfo('hash(k1, k2, k3)', 13)
client.create_table(table_name, DATA.schema_2, \
partition_info, distribution_info, storage_type='column', set_null=True)
assert client.show_tables(table_name)
assert client.get_index(table_name)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_4, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
sql = 'SELECT * FROM %s.%s ' \
'ORDER BY k2 nulls last, k1 nulls last, k3, k4, k5, k6, k7, k8, k9, k10' \
% (database_name, table_name)
assert common.check_by_file(DATA.expected_file_4, sql=sql, client=client)
client.clean(database_name)
def test_define_as():
"""
{
"title": "test_sys_null.test_define_as",
"describe": "通过NULL DEFINE AS指定特定的字符代表NULL,导入含有特定字符的数据,验证数据正确性",
"tag": "system,p1,fuzz"
}
"""
"""
通过NULL DEFINE AS指定特定的字符代表NULL,导入含有特定字符的数据,验证数据正确性
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
client.create_table(table_name, DATA.schema_2, storage_type='column', set_null=True)
assert client.show_tables(table_name)
assert client.get_index(table_name)
property_list = ["k1 = replace_value('\\\\0xU', NULL)", \
"k2 = replace_value('\\\\0xU', NULL)", \
"k3 = replace_value('\\\\0xU', NULL)", \
"k4 = replace_value('\\\\0xN', NULL)"]
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_7, table_name, set_list=property_list)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
#property_list = property_list,
sql = 'SELECT * FROM %s.%s ORDER BY k2 nulls last, k1 nulls last' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_7, sql=sql, client=client)
client.clean(database_name)
@pytest.mark.skip()
def test_null_be():
"""
{
"title": "test_sys_null.test_null_be",
"describe": "导入后,触发BE/CE,验证数据正确性, disable",
"tag": "autotest"
}
"""
"""
导入后,触发BE/CE,验证数据正确性
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
assert client.use(database_name)
client.create_table(table_name, DATA.schema_2, storage_type='column', set_null=True)
assert client.show_tables(table_name)
assert client.get_index(table_name)
label_1 = 'label_1'
label_2 = 'label_2'
label_3 = 'label_3'
label_4 = 'label_4'
label_5 = 'label_5'
data_desc_list_1 = palo_client.LoadDataInfo(DATA.hdfs_file_8_1, table_name)
data_desc_list_2 = palo_client.LoadDataInfo(DATA.hdfs_file_8_2, table_name)
data_desc_list_3 = palo_client.LoadDataInfo(DATA.hdfs_file_8_3, table_name)
data_desc_list_4 = palo_client.LoadDataInfo(DATA.hdfs_file_8_4, table_name)
data_desc_list_5 = palo_client.LoadDataInfo(DATA.hdfs_file_8_5, table_name)
assert client.batch_load(label_1, data_desc_list_1, broker=broker_info)
assert client.batch_load(label_2, data_desc_list_2, broker=broker_info)
assert client.batch_load(label_3, data_desc_list_3, broker=broker_info)
assert client.batch_load(label_4, data_desc_list_4, broker=broker_info)
assert client.batch_load(label_5, data_desc_list_5, broker=broker_info)
assert client.wait_load_job(label_1)
assert client.wait_load_job(label_2)
assert client.wait_load_job(label_3)
assert client.wait_load_job(label_4)
assert client.wait_load_job(label_5)
tablet_id, host_name = client.get_tablet_id_and_be_host_list(table_name)[0]
print(tablet_id, host_name)
# assert env.wait_be(host_name, tablet_id)
sql = 'SELECT * FROM %s.%s ORDER BY k2, k1' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_8, sql=sql, client=client)
def test_schema_change_add_null():
"""
{
"title": "test_sys_null.test_schema_change_add_null",
"describe": "增加新列为NULL列",
"tag": "system,p1"
}
"""
"""
增加新列为NULL列
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
client.create_table(table_name, DATA.schema_2, storage_type='column', set_null=True)
assert client.show_tables(table_name)
assert client.get_index(table_name)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_4, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
sql = 'SELECT * FROM %s.%s ORDER BY k2 nulls last, k1 nulls last' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_4, sql=sql, client=client)
column_list = [('v11', 'INT', 'SUM'),]
assert client.schema_change_add_column(table_name, column_list, \
after_column_name='v10', is_wait_job=True, set_null=True)
sql = 'SELECT * FROM %s.%s ORDER BY k2 nulls last, k1 nulls last' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_9, sql=sql, client=client)
client.clean(database_name)
"""
# disable check be/ce
tablet_id, host_name = client.get_tablet_id_and_be_host_list(table_name)[0]
print(tablet_id, host_name)
assert client.delete(table_name, [('k1', '>', '127'),], table_name)
assert client.delete(table_name, [('k1', '>', '127'),], table_name)
assert client.delete(table_name, [('k1', '>', '127'),], table_name)
assert client.delete(table_name, [('k1', '>', '127'),], table_name)
assert client.delete(table_name, [('k1', '>', '127'),], table_name)
#assert env.restart_be(host_name)
assert env.wait_be(host_name, tablet_id)
assert client.verify_without_schema(sql, DATA.expected_file_9)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_9_1, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True)
sql = 'SELECT * FROM %s.%s ORDER BY k2, k1' % (database_name, table_name)
assert client.verify_without_schema(sql, DATA.expected_file_9_1)
"""
def test_schema_change_add_key_null():
"""
{
"title": "test_sys_null.test_schema_change_add_key_null",
"describe": "增加新列为NULL列",
"tag": "system,p1"
}
"""
"""
增加新列为NULL列
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
client.create_table(table_name, DATA.schema_2, storage_type='column', set_null=True)
assert client.show_tables(table_name)
assert client.get_index(table_name)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_4, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
sql = 'SELECT * FROM %s.%s ORDER BY k2 nulls last, k1 nulls last' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_4, sql=sql, client=client)
column_list = [('add_key', 'INT', None),]
assert client.schema_change_add_column(table_name, column_list,
after_column_name='k2', is_wait_job=True, set_null=True)
sql = 'SELECT * FROM %s.%s ORDER BY k2 nulls last, k1 nulls last' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_10, sql=sql, client=client)
set_list = ['add_key = replace_value("None", NULL)']
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_10_1, table_name, set_list=set_list)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
sql = 'SELECT * FROM %s.%s ORDER BY k2 nulls last, k1 nulls last' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_10_1, sql=sql, client=client)
client.clean(database_name)
def test_schema_change_add_key_not_null():
"""
{
"title": "test_sys_null.test_schema_change_add_key_not_null",
"describe": "增加新列为NULL列",
"tag": "system,p1"
}
"""
"""
增加新列为NULL列
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
client.create_table(table_name, DATA.schema_2, storage_type='column', set_null=True)
assert client.show_tables(table_name)
assert client.get_index(table_name)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_4, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
sql = 'SELECT * FROM %s.%s ORDER BY k2 nulls last, k1 nulls last' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_4, sql=sql, client=client)
column_list = [('add_key', 'INT', None, '1'),]
assert client.schema_change_add_column(table_name, column_list,
after_column_name='k2', is_wait_job=True, set_null=False)
sql = 'SELECT * FROM %s.%s ORDER BY k2 nulls last, k1 nulls last' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_n10, sql=sql, client=client)
# set_list = ['add_key = replace_value("None", NULL)']
# data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_10_1, table_name, set_list=set_list)
column_list = ['k1', 'k2', 'add_key', 'k3', 'k4', 'k5', 'k6', 'k7', 'k8', 'k9', 'k10', 'v1',
'v2', 'v3', 'v4', 'v5', 'v6', 'v7', 'v8', 'v9']
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_10_1, table_name,
column_name_list=column_list)
assert not client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
sql = 'SELECT * FROM %s.%s ORDER BY k2 nulls last, k1 nulls last' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_n10, sql=sql, client=client)
client.clean(database_name)
def test_not_null():
"""
{
"title": "test_sys_null.test_not_null",
"describe": "not null约束, 删除NOT NULL约束,导入NULL数据",
"tag": "system,p1,fuzz"
}
"""
"""
not null约束
删除NOT NULL约束,导入NULL数据
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
distribution_info = palo_client.DistributionInfo('HASH(k3)', 5)
client.create_table(table_name, DATA.schema_3, storage_type='column',
distribution_info=distribution_info)
assert client.show_tables(table_name)
assert client.get_index(table_name)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_4, table_name)
assert not client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
assert client.schema_change_modify_column(table_name, 'k1', 'TINYINT NULL',
is_wait_job=True, is_wait_delete_old_schema=True)
assert client.schema_change_modify_column(table_name, 'k2', 'SMALLINT NULL', \
is_wait_job=True, is_wait_delete_old_schema=True)
assert client.schema_change_modify_column(table_name, 'k4', 'BIGINT NULL', is_wait_job=True)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_4, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
sql = 'SELECT * FROM %s.%s ORDER BY k2 nulls last, k1 nulls last' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_4, sql=sql, client=client)
client.clean(database_name)
@pytest.mark.skip()
def test_schema_change_order_by():
"""
{
"title": "test_sys_null.test_schema_change_order_by",
"describe": "重排序导致shortkey列变化,NULL列提前,导入数据,验证数据正确",
"tag": "autotest"
}
"""
"""
重排序导致shortkey列变化,NULL列提前,导入数据,验证数据正确
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
client.create_table(table_name, DATA.schema_2, storage_type='column', set_null=True)
assert client.show_tables(table_name)
assert client.get_index(table_name)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_4, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
sql = 'SELECT * FROM %s.%s ORDER BY k2, k1' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_4, sql=sql, client=client)
# column_list = [('add_key', 'INT', None),]
# assert client.schema_change_add_column(table_name, column_list, \
# after_column_name='k2', is_wait_job=True)
# sql = 'SELECT * FROM %s.%s ORDER BY k2, k1' % (database_name, table_name)
# assert client.verify_without_schema(sql, DATA.expected_file_10)
column_name_list = ['k10', 'k5', 'k1', 'k2', 'k3', 'k4', \
'k6', 'k7', 'k8', 'k9', 'v5', 'v1', 'v2', 'v3', 'v4', 'v7', 'v8', 'v6', 'v9', 'v10']
assert client.schema_change_order_column(table_name, column_name_list, is_wait_job=True)
sql = 'SELECT * FROM %s.%s ORDER BY k2, k1' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_11, sql=sql, client=client)
"""
# disable check be
tablet_id, host_name = client.get_tablet_id_and_be_host_list(table_name)[0]
print(tablet_id, host_name)
assert client.delete(table_name, [('k1', '>', '127'),], table_name)
assert client.delete(table_name, [('k1', '>', '127'),], table_name)
assert client.delete(table_name, [('k1', '>', '127'),], table_name)
assert client.delete(table_name, [('k1', '>', '127'),], table_name)
assert client.delete(table_name, [('k1', '>', '127'),], table_name)
assert client.delete(table_name, [('k1', '>', '127'),], table_name)
#assert env.restart_be(host_name)
assert env.wait_be(host_name, tablet_id)
sql = 'SELECT * FROM %s.%s ORDER BY k2, k1' % (database_name, table_name)
assert client.verify_without_schema(sql, DATA.expected_file_11)
"""
def test_rollup():
"""
{
"title": "test_sys_null.test_rollup",
"describe": "创建含有NULL列的rollup表,导入数据,验证命中rollup表的查询结果正确",
"tag": "system,p1"
}
"""
"""
创建含有NULL列的rollup表,导入数据,验证命中rollup表的查询结果正确
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
client.use(database_name)
client.create_table(table_name, DATA.schema_2, storage_type='column', set_null=True)
rollup_field = ['k4', 'k1', 'k3', 'k2', 'v1']
client.create_rollup_table(table_name, index_name, rollup_field, is_wait=True)
assert client.show_tables(table_name)
assert client.get_index(table_name)
assert client.get_index(table_name, index_name=index_name)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_12, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
#sql = 'SELECT * FROM %s.%s ORDER BY k2, k1' % (database_name, table_name)
#assert client.verify_without_schema(sql, DATA.expected_file_4)
sql = 'SELECT k4, k1, k3, k2, SUM(v1) ' \
'FROM %s GROUP BY k4, k1, k3, k2 ORDER BY k1' % (table_name)
shoot_table = common.get_explain_rollup(client, sql)
LOG.info(L('shoot table:', shoot_table=shoot_table))
assert index_name in shoot_table
sql = 'SELECT k4, k1, k3, k2, SUM(v1) FROM %s ' \
'GROUP BY k4, k1, k3, k2 ORDER BY k1 nulls last, k2 nulls last' % (table_name)
# ORDER BY K1
assert common.check_by_file(DATA.expected_file_12, sql=sql, client=client)
client.clean(database_name)
@pytest.mark.skip()
def test_load_rollup():
"""
{
"title": "test_sys_null.test_load_rollup",
"describe": "创建含有NULL列的rollup表,导入数据,验证命中rollup表的查询结果正确",
"tag": "autotest"
}
"""
"""
创建含有NULL列的rollup表,导入数据,验证命中rollup表的查询结果正确
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
client.use(database_name)
client.create_table(table_name, DATA.schema_2, storage_type='column', set_null=True)
assert client.show_tables(table_name)
assert client.get_index(table_name)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_12, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
rollup_field = ['k4', 'k1', 'k3', 'k2', 'v1']
client.create_rollup_table(table_name, index_name, rollup_field, is_wait=True)
assert client.get_index(table_name, index_name=index_name)
#sql = 'SELECT * FROM %s.%s ORDER BY k2, k1' % (database_name, table_name)
#assert client.verify_without_schema(sql, DATA.expected_file_4)
sql = 'SELECT k4, k1, k3, k2, SUM(v1) FROM %s ' \
'GROUP BY k4, k1, k3, k2 ORDER BY k1' % (table_name)
shoot_table = common.get_explain_rollup(client, sql)
LOG.info(L('shoot table:', shoot_table=shoot_table))
assert index_name in shoot_table, 'expect rollup %s, but %s' % (index_name, shoot_table)
sql = 'SELECT k4, k1, k3, k2, SUM(v1) FROM %s ' \
'GROUP BY k4, k1, k3, k2 ORDER BY k1, k2' % (table_name)
assert common.check_by_file(DATA.expected_file_12, sql=sql, client=client)
"""
# disable check be
tablet_id, host_name = client.get_tablet_id_and_be_host_list(table_name)[0]
print(tablet_id, host_name)
time.sleep(15)
assert client.delete(table_name, [('k1', '>', '126'),], table_name)
# time.sleep(2)
# assert client.delete(table_name, [('k1', '>', '127'),], table_name)
# time.sleep(2)
# assert client.delete(table_name, [('k1', '>', '127'),], table_name)
# time.sleep(2)
# assert client.delete(table_name, [('k1', '>', '127'),], table_name)
# time.sleep(2)
# assert client.delete(table_name, [('k1', '>', '127'),], table_name)
# assert env.wait_be(host_name, tablet_id)
# sql = 'SELECT k4, k1, k3, k2, SUM(v1) FROM %s ' \
# 'GROUP BY k4, k1, k3, k2 ORDER BY k1' % (table_name)
# # ORDER BY K1
# assert client.verify_without_schema(sql, DATA.expected_file_12)
"""
@pytest.mark.skip()
def test_delete():
"""
{
"title": "test_sys_null.test_delete",
"describe": "测试delete",
"tag": "autotest"
}
"""
"""
测试delete
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
assert client.use(database_name)
client.create_table(table_name, DATA.schema_2, storage_type='column', set_null=True)
assert client.show_tables(table_name)
assert client.get_index(table_name)
label_1 = 'label_1'
label_2 = 'label_2'
label_3 = 'label_3'
label_4 = 'label_4'
label_5 = 'label_5'
data_desc_list_1 = palo_client.LoadDataInfo(DATA.hdfs_file_8_1, table_name)
data_desc_list_2 = palo_client.LoadDataInfo(DATA.hdfs_file_8_2, table_name)
data_desc_list_3 = palo_client.LoadDataInfo(DATA.hdfs_file_8_3, table_name)
data_desc_list_4 = palo_client.LoadDataInfo(DATA.hdfs_file_8_4, table_name)
data_desc_list_5 = palo_client.LoadDataInfo(DATA.hdfs_file_8_5, table_name)
assert client.batch_load(label_1, data_desc_list_1, broker=broker_info)
assert client.wait_load_job(label_1)
assert client.delete(table_name, [('k5', '=', '-90000'),], table_name)
assert client.batch_load(label_2, data_desc_list_2, broker=broker_info)
assert client.wait_load_job(label_2)
assert client.delete(table_name, [('k5', '=', '-70000'),], table_name)
assert client.batch_load(label_3, data_desc_list_3, broker=broker_info)
assert client.batch_load(label_4, data_desc_list_4, broker=broker_info)
assert client.batch_load(label_5, data_desc_list_5, broker=broker_info)
assert client.wait_load_job(label_3)
assert client.wait_load_job(label_4)
assert client.wait_load_job(label_5)
sql = 'SELECT * FROM %s.%s ORDER BY k2, k1' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_13, sql=sql, client=client)
def test_delete_and_schema_change():
"""
{
"title": "test_sys_null.test_delete_and_schema_change",
"describe": "测试delete and schema change",
"tag": "system,p1"
}
"""
"""
测试delete and schema change
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
client.use(database_name)
client.create_table(table_name, DATA.schema_2, storage_type='column', set_null=True)
assert client.show_tables(table_name)
assert client.get_index(table_name)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_4, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
sql = 'SELECT * FROM %s.%s ORDER BY k2 nulls last, k1 nulls last' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_4, sql=sql, client=client)
assert client.delete(table_name, [('k1', '>=', '127'),], table_name)
sql = 'SELECT * FROM %s.%s ORDER BY k2 nulls last, k1 nulls last' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_ds_1, sql=sql, client=client)
column_list = [('add_key', 'INT', None), ]
assert client.schema_change_add_column(table_name, column_list,
after_column_name='k2', is_wait_job=True, set_null=True)
sql = 'SELECT * FROM %s.%s ORDER BY k2 nulls last, k1 nulls last' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_list_data_2, sql=sql, client=client)
assert client.delete(table_name, [('k1', '>', '127'),], table_name)
assert client.delete(table_name, [('k1', '>', '127'),], table_name)
assert client.delete(table_name, [('k1', '>', '127'),], table_name)
assert client.delete(table_name, [('k1', '>', '127'),], table_name)
assert client.delete(table_name, [('k1', '>', '127'),], table_name)
assert client.delete(table_name, [('k1', '>', '127'),], table_name)
sql = 'SELECT * FROM %s.%s ORDER BY k2 nulls last, k1 nulls last' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_ds_2, sql=sql, client=client)
client.clean(database_name)
def test_largeint():
"""
{
"title": "test_sys_null.test_largeint",
"describe": "测试largeint",
"tag": "system,p1"
}
"""
"""
测试largeint
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
client.create_table(table_name, DATA.schema_4, storage_type='column', set_null=True)
assert client.show_tables(table_name)
assert client.get_index(table_name)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_14_1, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_14_2, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
sql = 'SELECT * FROM %s.%s ORDER BY k2 nulls last, k1 nulls last' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_14, sql=sql, client=client)
client.clean(database_name)
def test_all_null():
"""
{
"title": "test_sys_null.test_all_null",
"describe": "测试 all null",
"tag": "system,p1"
}
"""
"""
测试 all null
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
client.create_table(table_name, DATA.schema_4, storage_type='column', set_null=True)
assert client.show_tables(table_name)
assert client.get_index(table_name)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_all_null, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
sql = 'SELECT * FROM %s.%s ORDER BY k2, k1' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_all_null, sql=sql, client=client)
client.clean(database_name)
def test_bloom_filter():
"""
{
"title": "test_sys_null.test_bloom_filter",
"describe": "测试bloom filter",
"tag": "system,p1"
}
"""
"""
测试bloom filter
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
bloom_filter_column_list = ['k5', 'k7', 'k9']
client.create_table(table_name, DATA.schema_2, storage_type='column',
bloom_filter_column_list=bloom_filter_column_list, set_null=True)
assert client.show_tables(table_name)
assert client.get_index(table_name)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_5, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
sql = 'SELECT * FROM %s.%s where ' \
'k5 = -170141183460469231731687303715884105727' \
% (database_name, table_name)
assert common.check_by_file(DATA.expected_file_15_1, sql=sql, client=client)
sql = 'SELECT * FROM %s.%s where k5 is NULL' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_15_1_1, sql=sql, client=client)
sql = 'SELECT * FROM %s.%s where k7 = "2452-09-22 13:38:55"' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_15_2, sql=sql, client=client)
sql = 'SELECT * FROM %s.%s where k7 in ' \
'("2452-09-22 13:38:55", "2479-02-15 20:33:27") order by k1' \
% (database_name, table_name)
assert common.check_by_file(DATA.expected_file_15_2_1, sql=sql, client=client)
sql = 'SELECT * FROM %s.%s where k9 = "中文"' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_15_3, sql=sql, client=client)
sql = 'SELECT * FROM %s.%s where v7 = "2677-02-03"' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_15_4, sql=sql, client=client)
sql = 'SELECT * FROM %s.%s where v9 = "d"' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_15_4, sql=sql, client=client)
sql = 'SELECT * FROM %s.%s where k1 is NULL ' \
'and k2 is NULL and k3 is NULL and k4 is NULL and k6 is NULL ' \
'and k7 is NULL and k8 is NULL and k9 is NULL and k10 is NULL ' \
'and v1 is NULL and v2 is NULL and v3 is NULL and v4 is NULL ' \
'and v6 is NULL and v7 is NULL and v8 is NULL and v9 is NULL ' \
'and v10 is NULL' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_15_1_1, sql=sql, client=client)
client.clean(database_name)
def test_join():
"""
{
"title": "test_sys_null.test_join",
"describe": "测试join",
"tag": "system,p1"
}
"""
"""
测试join
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
client.use(database_name)
client.create_table(table_name, DATA.schema_2, storage_type='column', set_null=True)
assert client.show_tables(table_name)
assert client.get_index(table_name)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_4, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
sql = 'SELECT a.v1, b.v2 FROM %s as a, %s as b ' \
'WHERE a.k1=b.k1 ORDER BY a.k2 nulls last' % (table_name, table_name)
assert common.check_by_file(DATA.expected_file_16, sql=sql, client=client)
client.clean(database_name)
def test_varchar_hash_null():
"""
{
"title": "test_sys_null.test_varchar_hash_null",
"describe": "varchar字段分桶字段多个版本全是NULL",
"tag": "system,p1"
}
"""
"""
varchar字段分桶字段多个版本全是NULL,会出现core
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
distribution_info = palo_client.DistributionInfo('HASH(K9)', 13)
client.create_table(table_name, DATA.schema_2, \
distribution_info = distribution_info, storage_type='column', set_null=True)
assert client.show_tables(table_name)
assert client.get_index(table_name)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_17, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
sql = 'SELECT * FROM %s.%s ORDER BY k2 nulls last, k1 nulls last' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_17, sql=sql, client=client)
client.clean(database_name)
def test_modify():
"""
{
"title": "test_sys_null.test_modify",
"describe": "测试modify",
"tag": "system,p1"
}
"""
"""
测试modify
"""
database_name, table_name, index_name = util.gen_num_format_name_list()
LOG.info(L('', database_name=database_name, \
table_name=table_name, index_name=index_name))
client = palo_client.get_client(config.fe_host, config.fe_query_port, user=config.fe_user,
password=config.fe_password, http_port=config.fe_http_port)
assert client
client.clean(database_name)
client.create_database(database_name)
client.use(database_name)
distribution_info = palo_client.DistributionInfo('HASH(K2)', 13)
client.create_table(table_name, DATA.schema_2, distribution_info = distribution_info,
storage_type='column', set_null=True)
assert client.show_tables(table_name)
assert client.get_index(table_name)
data_desc_list = palo_client.LoadDataInfo(DATA.hdfs_file_4, table_name)
assert client.batch_load(util.get_label(), data_desc_list, is_wait=True, broker=broker_info)
sql = 'ALTER TABLE %s.%s ' % (database_name, table_name) + \
'MODIFY COLUMN k1 LARGEINT NULL, MODIFY COLUMN k9 VARCHAR(1024) NULL, ' + \
'MODIFY COLUMN v2 LARGEINT SUM NULL, MODIFY COLUMN v9 VARCHAR(1024) REPLACE NULL'
assert () == client.execute(sql)
client.wait_table_schema_change_job(table_name, database_name)
sql = 'SELECT * FROM %s.%s ORDER BY k2 nulls last, k1 nulls last' % (database_name, table_name)
assert common.check_by_file(DATA.expected_file_4, sql=sql, client=client)
client.clean(database_name)
if __name__ == '__main__':
setup_module()
test_null_be()