465 lines
17 KiB
Python
465 lines
17 KiB
Python
#!/bin/env python
|
|
# -*- coding: utf-8 -*-
|
|
# Licensed to the Apache Software Foundation (ASF) under one
|
|
# or more contributor license agreements. See the NOTICE file
|
|
# distributed with this work for additional information
|
|
# regarding copyright ownership. The ASF licenses this file
|
|
# to you under the Apache License, Version 2.0 (the
|
|
# "License"); you may not use this file except in compliance
|
|
# with the License. You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing,
|
|
# software distributed under the License is distributed on an
|
|
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
|
# KIND, either express or implied. See the License for the
|
|
# specific language governing permissions and limitations
|
|
# under the License.
|
|
|
|
############################################################################
|
|
#
|
|
# @file test_sys_partition_basic.py
|
|
# @date 2015/05/13 15:26:21
|
|
# @brief This file is a test file for palo data loading and verifying.
|
|
#
|
|
#############################################################################
|
|
|
|
"""
|
|
按照所有支持分区的数据类型进行分区建表,对查询结果进行正确性校验
|
|
"""
|
|
from data import partition as DATA
|
|
from lib import palo_config
|
|
from lib import palo_client
|
|
from lib import util
|
|
import random
|
|
|
|
LOG = palo_client.LOG
|
|
L = palo_client.L
|
|
config = palo_config.config
|
|
broker_info = palo_config.broker_info
|
|
|
|
|
|
def setup_module():
    """Create the module-level Palo client shared by every test in this file.

    The connection settings are all read from ``palo_config.config``. The
    resulting client is stored in the module global ``client``.
    """
    global client
    fe_host, fe_query_port = config.fe_host, config.fe_query_port
    connection_options = {
        'user': config.fe_user,
        'password': config.fe_password,
        'http_port': config.fe_http_port,
    }
    client = palo_client.get_client(fe_host, fe_query_port, **connection_options)
|
|
|
|
|
|
def check_partition_list(table_name, partition_name_list):
    """Assert that every partition in ``partition_name_list`` exists.

    Args:
        table_name: Name of the table whose partitions are looked up.
        partition_name_list: Iterable of partition names to check.

    Raises:
        AssertionError: If ``client.get_partition`` returns a falsy value
            for any of the names.
    """
    for name in partition_name_list:
        partition = client.get_partition(table_name, name)
        assert partition
|
|
|
|
|
|
def check_load_and_verify(table_name, partition_name_list):
    """Load the sample data into the table twice, verifying after each load.

    Args:
        table_name: Name of the table to load into and verify.
        partition_name_list: Not used by this function; kept so existing
            callers keep working.

    Raises:
        AssertionError: If either batch load or either verification returns
            a falsy value.
    """
    load_info = palo_client.LoadDataInfo(DATA.file_path_1, table_name)

    # First load: the table must match the expected files exactly once.
    first_load_ok = client.batch_load(util.get_label(), load_info,
                                      is_wait=True, broker=broker_info)
    assert first_load_ok
    first_verify_ok = client.verify(DATA.expected_data_file_list_1, table_name)
    assert first_verify_ok

    # Second load of the same file: verification is run against the expected
    # file list repeated twice.
    second_load_ok = client.batch_load(util.get_label(), load_info,
                                       is_wait=True, broker=broker_info)
    assert second_load_ok
    expected_twice = list(DATA.expected_data_file_list_1) * 2
    second_verify_ok = client.verify(expected_twice, table_name)
    assert second_verify_ok
|
|
|
|
|
|
def partition_check(table_name, column_name, partition_name_list,
                    partition_value_list, distribution_type, bucket_num, storage_type):
    """Create a partitioned table, confirm it exists, then load and verify data.

    Args:
        table_name: Name of the table to create.
        column_name: Partition column handed to ``palo_client.PartitionInfo``.
        partition_name_list: Names of the partitions to create and check.
        partition_value_list: Values handed to ``palo_client.PartitionInfo``
            alongside the names (presumably the range bounds -- confirm
            against ``PartitionInfo``).
        distribution_type: Distribution clause, e.g. ``'RANDOM'`` or
            ``'HASH(k1)'``.
        bucket_num: Bucket count handed to ``palo_client.DistributionInfo``.
        storage_type: Not used by this function; kept so existing callers
            keep working.

    Raises:
        AssertionError: If the table is not listed after creation, or if a
            partition check, load or verification fails.
    """
    partitioning = palo_client.PartitionInfo(
        column_name, partition_name_list, partition_value_list)
    bucketing = palo_client.DistributionInfo(distribution_type, bucket_num)

    client.create_table(table_name, DATA.schema_1, partitioning, bucketing)
    table_listed = client.show_tables(table_name)
    assert table_listed

    check_partition_list(table_name, partition_name_list)
    check_load_and_verify(table_name, partition_name_list)
|
|
|
|
|
|
def test_partition_by_tinyint_random_column_1():
    """
    {
    "title": "test_sys_partition_basic_a.test_partition_by_tinyint_random_column_1",
    "describe": "tinyint分区, 边界值,random, random_bucket_num, column",
    "tag": "system,p0,fuzz"
    }
    """
    # NOTE(review): the JSON docstring looks like machine-read case metadata,
    # so it is kept verbatim.
    # Case: tinyint partitioning, boundary values, RANDOM distribution,
    # random bucket number, column storage.
    db_name, tbl_name, idx_name = util.gen_num_format_name_list()
    LOG.info(L('', database_name=db_name, table_name=tbl_name, index_name=idx_name))

    # Start from an empty database.
    client.clean(db_name)
    client.create_database(db_name)

    bucket_count = random.randrange(1, 300)
    LOG.info(L('', random_bucket_num=bucket_count))

    partitions = ['partition_' + suffix for suffix in 'abcdef']
    boundaries = ['-127', '-1', '0', '1', '126', '127']
    partition_check(tbl_name, 'k1', partitions, boundaries,
                    'RANDOM', bucket_count, 'column')
    client.clean(db_name)
|
|
|
|
|
|
def test_partition_by_tinyint_random_hash_1():
    """
    {
    "title": "test_sys_partition_basic_a.test_partition_by_tinyint_random_hash_1",
    "describe": "tinyint分区, 边界值,hash(分区列), random_bucket_num, column",
    "tag": "system,p1,fuzz"
    }
    """
    # NOTE(review): the JSON docstring looks like machine-read case metadata,
    # so it is kept verbatim.
    # Case: tinyint partitioning, boundary values, hash on the partition
    # column, random bucket number, column storage.
    db_name, tbl_name, idx_name = util.gen_num_format_name_list()
    LOG.info(L('', database_name=db_name, table_name=tbl_name, index_name=idx_name))

    # Start from an empty database.
    client.clean(db_name)
    client.create_database(db_name)

    bucket_count = random.randrange(1, 300)
    LOG.info(L('', random_bucket_num=bucket_count))

    partitions = ['partition_' + suffix for suffix in 'abcdef']
    boundaries = ['-127', '-1', '0', '1', '126', '127']
    partition_check(tbl_name, 'k1', partitions, boundaries,
                    'HASH(k1)', bucket_count, 'column')
    client.clean(db_name)
|
|
|
|
|
|
def test_partition_by_tinyint_random_hash_2():
    """
    {
    "title": "test_sys_partition_basic_a.test_partition_by_tinyint_random_hash_2",
    "describe": "tinyint分区, 边界值,hash(非分区列), random_bucket_num, column",
    "tag": "system,p0,fuzz"
    }
    """
    # NOTE(review): the JSON docstring looks like machine-read case metadata,
    # so it is kept verbatim.
    # Case: tinyint partitioning, boundary values, hash on a non-partition
    # column, random bucket number, column storage.
    db_name, tbl_name, idx_name = util.gen_num_format_name_list()
    LOG.info(L('', database_name=db_name, table_name=tbl_name, index_name=idx_name))

    # Start from an empty database.
    client.clean(db_name)
    client.create_database(db_name)

    bucket_count = random.randrange(1, 300)
    LOG.info(L('', random_bucket_num=bucket_count))

    partitions = ['partition_' + suffix for suffix in 'abcdef']
    boundaries = ['-127', '-1', '0', '1', '126', '127']
    partition_check(tbl_name, 'k1', partitions, boundaries,
                    'HASH(k2)', bucket_count, 'column')
    client.clean(db_name)
|
|
|
|
|
|
def test_partition_by_tinyint_random_hash_3():
    """
    {
    "title": "test_sys_partition_basic_a.test_partition_by_tinyint_random_hash_3",
    "describe": "tinyint分区, 边界值,hash(所有非分区列), random_bucket_num, column",
    "tag": "system,p0,fuzz"
    }
    """
    # NOTE(review): the JSON docstring looks like machine-read case metadata,
    # so it is kept verbatim.
    # Case: tinyint partitioning, boundary values, hash on all non-partition
    # columns, random bucket number, column storage.
    db_name, tbl_name, idx_name = util.gen_num_format_name_list()
    LOG.info(L('', database_name=db_name, table_name=tbl_name, index_name=idx_name))

    # Start from an empty database.
    client.clean(db_name)
    client.create_database(db_name)

    bucket_count = random.randrange(1, 300)
    LOG.info(L('', random_bucket_num=bucket_count))

    partitions = ['partition_' + suffix for suffix in 'abcdef']
    boundaries = ['-127', '-1', '0', '1', '126', '127']
    partition_check(tbl_name, 'k1', partitions, boundaries,
                    'HASH(k2, k3, k4, k5)', bucket_count, 'column')
    client.clean(db_name)
|
|
|
|
|
|
def test_partition_by_tinyint_random_hash_4():
    """
    {
    "title": "test_sys_partition_basic_a.test_partition_by_tinyint_random_hash_4",
    "describe": "tinyint分区, 边界值,hash(所有列), random_bucket_num, column",
    "tag": "system,p0,fuzz"
    }
    """
    # NOTE(review): the JSON docstring looks like machine-read case metadata,
    # so it is kept verbatim.
    # Case: tinyint partitioning, boundary values, hash on all columns,
    # random bucket number, column storage.
    db_name, tbl_name, idx_name = util.gen_num_format_name_list()
    LOG.info(L('', database_name=db_name, table_name=tbl_name, index_name=idx_name))

    # Start from an empty database.
    client.clean(db_name)
    client.create_database(db_name)

    bucket_count = random.randrange(1, 300)
    LOG.info(L('', random_bucket_num=bucket_count))

    partitions = ['partition_' + suffix for suffix in 'abcdef']
    boundaries = ['-127', '-1', '0', '1', '126', '127']
    partition_check(tbl_name, 'k1', partitions, boundaries,
                    'HASH(k1, k2, k3, k4, k5)', bucket_count, 'column')
    client.clean(db_name)
|
|
|
|
|
|
def test_partition_by_tinyint_random_hash_5():
    """
    {
    "title": "test_sys_partition_basic_a.test_partition_by_tinyint_random_hash_5",
    "describe": " tinyint分区, 边界值,hash(部分非分区列), random_bucket_num, column",
    "tag": "system,p1,fuzz"
    }
    """
    # NOTE(review): the JSON docstring looks like machine-read case metadata,
    # so it is kept verbatim.
    # Case: tinyint partitioning, boundary values, hash on some of the
    # non-partition columns, random bucket number, column storage.
    db_name, tbl_name, idx_name = util.gen_num_format_name_list()
    LOG.info(L('', database_name=db_name, table_name=tbl_name, index_name=idx_name))

    # Start from an empty database.
    client.clean(db_name)
    client.create_database(db_name)

    bucket_count = random.randrange(1, 300)
    LOG.info(L('', random_bucket_num=bucket_count))

    partitions = ['partition_' + suffix for suffix in 'abcdef']
    boundaries = ['-127', '-1', '0', '1', '126', '127']
    partition_check(tbl_name, 'k1', partitions, boundaries,
                    'HASH(k3, k4, k5)', bucket_count, 'column')
    client.clean(db_name)
|
|
|
|
|
|
def test_partition_by_smallint():
    """
    {
    "title": "test_sys_partition_basic_a.test_partition_by_smallint",
    "describe": "smallint分区",
    "tag": "system,p1"
    }
    """
    # NOTE(review): the JSON docstring looks like machine-read case metadata,
    # so it is kept verbatim.
    # Case: smallint partitioning.
    db_name, tbl_name, idx_name = util.gen_num_format_name_list()
    LOG.info(L('', database_name=db_name, table_name=tbl_name, index_name=idx_name))

    # Start from an empty database.
    client.clean(db_name)
    client.create_database(db_name)

    partitions = ['partition_' + suffix for suffix in 'abcd']
    boundaries = ['10', '20', '30', 'MAXVALUE']
    partition_check(tbl_name, 'k2', partitions, boundaries, 'RANDOM', 13, 'column')
    client.clean(db_name)
|
|
|
|
|
|
def test_partition_by_smallint_over_range():
    """
    {
    "title": "test_sys_partition_basic_a.test_partition_by_smallint_over_range",
    "describe": "smallint分区, 边界值,hash(部分非分区列),乱序,random_bucket_num, column",
    "tag": "system,p1,fuzz"
    }
    """
    # NOTE(review): the JSON docstring looks like machine-read case metadata,
    # so it is kept verbatim.
    # Case: smallint partitioning, boundary values, hash on some of the
    # non-partition columns listed out of order, random bucket number,
    # column storage.
    db_name, tbl_name, idx_name = util.gen_num_format_name_list()
    LOG.info(L('', database_name=db_name, table_name=tbl_name, index_name=idx_name))

    # Start from an empty database.
    client.clean(db_name)
    client.create_database(db_name)

    bucket_count = random.randrange(1, 300)
    LOG.info(L('', random_bucket_num=bucket_count))

    # Boundaries sit next to both ends of the signed 16-bit range
    # [-2**15, 2**15 - 1].
    lowest = -2 ** 15
    highest = 2 ** 15 - 1
    boundaries = [str(lowest + 1), str(lowest + 2), '0', '1',
                  str(highest - 1), str(highest)]
    partitions = ['partition_' + suffix for suffix in 'abcdef']
    partition_check(tbl_name, 'k2', partitions, boundaries,
                    'HASH(k4, k5, k1)', bucket_count, 'column')
    client.clean(db_name)
|
|
|
|
|
|
def test_partition_by_int():
    """
    {
    "title": "test_sys_partition_basic_a.test_partition_by_int",
    "describe": "int分区",
    "tag": "system,p1"
    }
    """
    # NOTE(review): the JSON docstring looks like machine-read case metadata,
    # so it is kept verbatim.
    # Case: int partitioning.
    db_name, tbl_name, idx_name = util.gen_num_format_name_list()
    LOG.info(L('', database_name=db_name, table_name=tbl_name, index_name=idx_name))

    # Start from an empty database.
    client.clean(db_name)
    client.create_database(db_name)

    partitions = ['partition_' + suffix for suffix in 'abcd']
    boundaries = ['100', '200', '300', 'MAXVALUE']
    partition_check(tbl_name, 'k3', partitions, boundaries, 'RANDOM', 13, 'column')
    client.clean(db_name)
|
|
|
|
|
|
def test_partition_by_int_over_range():
    """
    {
    "title": "test_sys_partition_basic_a.test_partition_by_int_over_range",
    "describe": "int分区, 边界值,hash(部分非分区列),乱序,random_bucket_num, column",
    "tag": "system,p1,fuzz"
    }
    """
    # NOTE(review): the JSON docstring looks like machine-read case metadata,
    # so it is kept verbatim.
    # Case: int partitioning, boundary values, hash on some of the
    # non-partition columns listed out of order, random bucket number,
    # column storage.
    db_name, tbl_name, idx_name = util.gen_num_format_name_list()
    LOG.info(L('', database_name=db_name, table_name=tbl_name, index_name=idx_name))

    # Start from an empty database.
    client.clean(db_name)
    client.create_database(db_name)

    bucket_count = random.randrange(1, 300)
    LOG.info(L('', random_bucket_num=bucket_count))

    # Boundaries sit next to both ends of the signed 32-bit range
    # [-2**31, 2**31 - 1].
    lowest = -2 ** 31
    highest = 2 ** 31 - 1
    boundaries = [str(lowest + 1), str(lowest + 2), '0', '1',
                  str(highest - 1), str(highest)]
    partitions = ['partition_' + suffix for suffix in 'abcdef']
    partition_check(tbl_name, 'k3', partitions, boundaries,
                    'HASH(k2, k4, k5, k1)', bucket_count, 'column')
    client.clean(db_name)
|
|
|
|
|
|
def test_partition_by_bigint():
    """
    {
    "title": "test_sys_partition_basic_a.test_partition_by_bigint",
    "describe": "bigint分区",
    "tag": "system,p1"
    }
    """
    # NOTE(review): the JSON docstring looks like machine-read case metadata,
    # so it is kept verbatim.
    # Case: bigint partitioning.
    db_name, tbl_name, idx_name = util.gen_num_format_name_list()
    LOG.info(L('', database_name=db_name, table_name=tbl_name, index_name=idx_name))

    # Start from an empty database.
    client.clean(db_name)
    client.create_database(db_name)

    partitions = ['partition_' + suffix for suffix in 'abcd']
    boundaries = ['1000', '2000', '3000', 'MAXVALUE']
    partition_check(tbl_name, 'k4', partitions, boundaries, 'RANDOM', 13, 'column')
    client.clean(db_name)
|
|
|
|
|
|
def test_partition_by_bigint_over_range():
    """
    {
    "title": "test_sys_partition_basic_a.test_partition_by_bigint_over_range",
    "describe": "bigint分区, 边界值,hash(部分非分区列),乱序,random_bucket_num, column",
    "tag": "system,p1,fuzz"
    }
    """
    # NOTE(review): the JSON docstring looks like machine-read case metadata,
    # so it is kept verbatim.
    # Case: bigint partitioning, boundary values, hash on some of the
    # non-partition columns listed out of order, random bucket number,
    # column storage.
    db_name, tbl_name, idx_name = util.gen_num_format_name_list()
    LOG.info(L('', database_name=db_name, table_name=tbl_name, index_name=idx_name))

    # Start from an empty database.
    client.clean(db_name)
    client.create_database(db_name)

    bucket_count = random.randrange(1, 300)
    LOG.info(L('', random_bucket_num=bucket_count))

    # Boundaries sit next to both ends of the signed 64-bit range
    # [-2**63, 2**63 - 1].
    lowest = -2 ** 63
    highest = 2 ** 63 - 1
    boundaries = [str(lowest + 1), str(lowest + 2), '0', '1',
                  str(highest - 1), str(highest)]
    partitions = ['partition_' + suffix for suffix in 'abcdef']
    partition_check(tbl_name, 'k4', partitions, boundaries,
                    'HASH(k2, k5, k1)', bucket_count, 'column')
    client.clean(db_name)
|
|
|
|
|
|
def test_partition_by_bigint_one_partition():
    """
    {
    "title": "test_sys_partition_basic_a.test_partition_by_bigint_one_partition",
    "describe": "bigint分区, 一个分区",
    "tag": "system,p1"
    }
    """
    # NOTE(review): the JSON docstring looks like machine-read case metadata,
    # so it is kept verbatim.
    # Case: bigint partitioning with a single partition.
    db_name, tbl_name, idx_name = util.gen_num_format_name_list()
    LOG.info(L('', database_name=db_name, table_name=tbl_name, index_name=idx_name))

    # Start from an empty database.
    client.clean(db_name)
    client.create_database(db_name)

    bucket_count = random.randrange(1, 300)
    LOG.info(L('', random_bucket_num=bucket_count))

    # The only partition value is the top of the signed 64-bit range.
    highest = 2 ** 63 - 1
    partitions = ['partition_a']
    boundaries = [str(highest)]
    partition_check(tbl_name, 'k4', partitions, boundaries,
                    'HASH(k2, k5, k1)', bucket_count, 'column')
    client.clean(db_name)
|
|
|
|
|
|
def teardown_module():
    """Module-level teardown hook; intentionally does nothing."""
|
|
|
|
|
|
if __name__ == "__main__":
    # Ad-hoc run outside the test runner: build the shared client, print the
    # broker configuration, then execute a single case.
    setup_module()
    print(broker_info)
    test_partition_by_int()
|
|
|