Files
doris/regression-test/suites/load/insert/test_array_insert.groovy
Mingyu Chen 32b1456b28 [feature-wip](array) remove array config and check array nested depth (#13428)
1. remove FE config `enable_array_type`
2. limit the nested depth of array in FE side.
3. Fix bug that when loading array from parquet, the decimal type is treated as bigint
4. Fix loading array from csv(vec-engine), handle null and "null"
5. Change the csv array loading behavior, if the array string format is invalid in csv, it will be converted to null. 
6. Remove `check_array_format()`, because it's logic is wrong and meaningless
7. Add stream load csv test cases and more parquet broker load tests
2022-10-20 15:52:31 +08:00

230 lines
9.3 KiB
Groovy

// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
suite("test_array_insert", "load") {
// define a sql table
def testTable = "tbl_test_array_insert"
def testTable01 = "tbl_test_array_insert01"
def testTable02 = "tbl_test_array_insert02"
def create_test_table = {testTablex, enable_vectorized_flag ->
if (enable_vectorized_flag) {
sql """ set enable_vectorized_engine = true """
} else {
sql """ set enable_vectorized_engine = false """
}
def result1 = sql """
CREATE TABLE IF NOT EXISTS ${testTable} (
`k1` INT(11) NULL COMMENT "",
`k2` ARRAY<LARGEINT> NULL COMMENT ""
) ENGINE=OLAP
DUPLICATE KEY(`k1`)
DISTRIBUTED BY HASH(`k1`) BUCKETS 1
PROPERTIES (
"replication_allocation" = "tag.location.default: 1",
"storage_format" = "V2"
)
"""
// DDL/DML return 1 row and 3 column, the only value is update row count
assertTrue(result1.size() == 1)
assertTrue(result1[0].size() == 1)
assertTrue(result1[0][0] == 0, "Create table should update 0 rows")
// insert 1 row to check whether the table is ok
def result2 = sql "INSERT INTO ${testTable} VALUES (100, [9223372036854775808])"
assertTrue(result2.size() == 1)
assertTrue(result2[0].size() == 1)
assertTrue(result2[0][0] == 1, "Insert should update 1 rows")
}
def create_test_table01 = {testTabley ->
def result1 = sql """
CREATE TABLE IF NOT EXISTS ${testTable01} (
`k1` int(11) NULL,
`k2` smallint(6) NULL,
`k3` int(11) NULL,
`k4` bigint(20) NULL,
`k5` char(20) NULL,
`k6` varchar(50) NULL,
`k7` date NULL,
`k8` datetime NULL,
`k9` float NULL,
`k10` double NULL,
`k11` decimal(20, 6) NULL,
`k12` boolean NULL,
`k13` text NULL
) ENGINE=OLAP
DUPLICATE KEY(`k1`)
COMMENT 'OLAP'
DISTRIBUTED BY HASH(`k1`) BUCKETS 1
PROPERTIES (
"replication_allocation" = "tag.location.default: 1",
"in_memory" = "false",
"storage_format" = "V2",
"disable_auto_compaction" = "false"
)
"""
// DDL/DML return 1 row and 3 column, the only value is update row count
assertTrue(result1.size() == 1)
assertTrue(result1[0].size() == 1)
assertTrue(result1[0][0] == 0, "Create table should update 0 rows")
// insert 1 row to check whether the table is ok
def result2 = sql """ INSERT INTO ${testTable01} VALUES (200, 2, 32768, 65535, 'b', "hello",
'2022-07-13', '2022-07-13 12:30:00', 0.67, 3.1415926, 6.67, false, 'happy life')
"""
assertTrue(result2.size() == 1)
assertTrue(result2[0].size() == 1)
assertTrue(result2[0][0] == 1, "Insert should update 1 rows")
}
def create_test_table02 = {testTablez ->
def result1 = sql """
CREATE TABLE IF NOT EXISTS ${testTable02} (
`k1` int(11) NULL,
`k2` array<smallint(6)> NULL,
`k3` array<int(11)> NULL,
`k4` array<bigint(20)> NULL,
`k5` array<char(20)> NULL,
`k6` array<varchar(50)> NULL,
`k7` array<date> NULL,
`k8` array<datetime> NULL,
`k9` array<float> NULL,
`k10` array<double> NULL,
`k11` array<decimal(20, 6)> NULL,
`k12` array<boolean> NULL,
`k13` array<text> NULL
) ENGINE=OLAP
DUPLICATE KEY(`k1`)
COMMENT 'OLAP'
DISTRIBUTED BY HASH(`k1`) BUCKETS 1
PROPERTIES (
"replication_allocation" = "tag.location.default: 1",
"in_memory" = "false",
"storage_format" = "V2",
"disable_auto_compaction" = "false"
)
"""
// DDL/DML return 1 row and 3 column, the only value is update row count
assertTrue(result1.size() == 1)
assertTrue(result1[0].size() == 1)
assertTrue(result1[0][0] == 0, "Create table should update 0 rows")
// insert 1 row to check whether the table is ok
def result2 = sql """ INSERT INTO ${testTable02} VALUES (100, [1, 2, 3], [32767, 32768, 32769], [65534, 65535, 65536],
['a', 'b', 'c'], ["hello", "world"], ['2022-07-13'], ['2022-07-13 12:30:00'], [0.33, 0.67], [3.1415926, 0.878787878],
[4, 5.5, 6.67], [true, false], ['happy life'])
"""
assertTrue(result2.size() == 1)
assertTrue(result2[0].size() == 1)
assertTrue(result2[0][0] == 1, "Insert should update 1 rows")
}
// case1: enable_vectorized_flag = false
try {
sql "DROP TABLE IF EXISTS ${testTable}"
create_test_table.call(testTable, false)
sql "INSERT INTO ${testTable} VALUES (1, [117341182548128045443221445, 170141183460469231731687303715884105727])"
// select the table and check whether the data is correct
qt_select "select * from ${testTable} order by k1"
} finally {
try_sql("DROP TABLE IF EXISTS ${testTable}")
}
// case2: enable_vectorized_flag = true
try {
sql "DROP TABLE IF EXISTS ${testTable}"
create_test_table.call(testTable, true)
sql "INSERT INTO ${testTable} VALUES (1, [117341182548128045443221446, 170141183460469231731687303715884105727])"
// select the table and check whether the data is correct
qt_select "select * from ${testTable} order by k1"
} finally {
try_sql("DROP TABLE IF EXISTS ${testTable}")
}
// case3: test the collect_list result to insert
try {
sql "DROP TABLE IF EXISTS ${testTable01}"
sql "DROP TABLE IF EXISTS ${testTable02}"
create_test_table01.call(testTable01)
create_test_table02.call(testTable02)
sql """INSERT INTO ${testTable02} select k1, collect_list(k2), collect_list(k3), collect_list(k4), collect_list(k5), collect_list(k6),
collect_list(k7), collect_list(k8), collect_list(k9), collect_list(k10), collect_list(k11), collect_list(k12), collect_list(k13)
from ${testTable01} group by k1;
"""
// select the table and check whether the data is correct
qt_select "select * from ${testTable02} order by k1"
} finally {
try_sql("DROP TABLE IF EXISTS ${testTable01}")
try_sql("DROP TABLE IF EXISTS ${testTable02}")
}
// case4: test the array_sort(collect_list()) result to insert and select
try {
sql "DROP TABLE IF EXISTS ${testTable01}"
sql "DROP TABLE IF EXISTS ${testTable02}"
create_test_table01.call(testTable01)
create_test_table02.call(testTable02)
sql """INSERT INTO ${testTable02} select k1, array_sort(collect_list(k2)), array_sort(collect_list(k3)), array_sort(collect_list(k4)),
array_sort(collect_list(k5)), array_sort(collect_list(k6)), array_sort(collect_list(k7)), array_sort(collect_list(k8)),
array_sort(collect_list(k9)), array_sort(collect_list(k10)), array_sort(collect_list(k11)), array_sort(collect_list(k12)),
array_sort(collect_list(k13)) from ${testTable01} group by k1;
"""
// select the table and check whether the data is correct
qt_select "select * from ${testTable02} order by k1"
qt_select "select array_avg(k2), array_avg(k3), array_avg(k4), array_avg(k9), array_avg(k10) from ${testTable02} order by k1"
} finally {
try_sql("DROP TABLE IF EXISTS ${testTable01}")
try_sql("DROP TABLE IF EXISTS ${testTable02}")
}
// case5: test to insert 'array<boolean>'
try {
sql "DROP TABLE IF EXISTS ${testTable02}"
create_test_table02.call(testTable02)
sql """INSERT INTO ${testTable02} VALUES (200, [1, 2, 3], [32767, 32768, 32769], [65534, 65535, 65536],
['a', 'b', 'c'], ["hello", "world"], ['2022-07-13'], ['2022-07-13 12:30:00'], [0.33, 0.67], [3.1415926, 0.878787878],
[4, 5.5, 6.67], '[1, 0, 1, 0]', ['happy life'])
"""
// select the table and check whether the data is correct
qt_select "select * from ${testTable02} order by k1"
} finally {
try_sql("DROP TABLE IF EXISTS ${testTable02}")
}
}