// Licensed to the Apache Software Foundation (ASF) under one // or more contributor license agreements. See the NOTICE file // distributed with this work for additional information // regarding copyright ownership. The ASF licenses this file // to you under the Apache License, Version 2.0 (the // "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, // software distributed under the License is distributed on an // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, either express or implied. See the License for the // specific language governing permissions and limitations // under the License. #include #include #include "common/object_pool.h" #include "exprs/expr.h" #include "exprs/expr_context.h" #include "olap/row_block.h" #include "olap/olap_table.h" #include "runtime/runtime_state.h" #include "util/debug_util.h" #include "util/logging.h" using std::vector; using std::string; using std::endl; using std::stringstream; namespace doris { class TestRowBlock : public testing::Test { public: TestRowBlock() {} void SetUp() { } void TearDown() { } void SetRows(RowBlock& row_block) { } }; TEST_F(TestRowBlock, init) { std::vector fields; { // k1: bigint { FieldInfo info; info.name = "k1"; info.type = OLAP_FIELD_TYPE_BIGINT; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 8; info.is_key = true; fields.push_back(info); } // k2: char { FieldInfo info; info.name = "k2"; info.type = OLAP_FIELD_TYPE_CHAR; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 10; info.is_key = true; fields.push_back(info); } // k3: varchar { FieldInfo info; info.name = "k3"; info.type = OLAP_FIELD_TYPE_VARCHAR; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 20; info.is_key = true; fields.push_back(info); } } { // has nullbyte RowBlock block(fields); RowBlockInfo block_info; block_info.row_num = 1024; block_info.data_file_type = COLUMN_ORIENTED_FILE; block_info.null_supported = true; auto res = block.init(block_info); ASSERT_EQ(OLAP_SUCCESS, res); // num_rows * (num_nullbytes + bigint + char + varchar) ASSERT_EQ(1024 * (3 + 8 + 10 + (4 + 20)), block.buf_len()); } { // has nullbyte RowBlock block(fields); RowBlockInfo block_info; block_info.row_num = 1024; block_info.data_file_type = COLUMN_ORIENTED_FILE; block_info.null_supported = false; auto res = block.init(block_info); ASSERT_EQ(OLAP_SUCCESS, res); // num_rows * (num_nullbytes + bigint + char + varchar) ASSERT_EQ(1024 * (3 + 8 + 10 + (4 + 20)), block.buf_len()); } } TEST_F(TestRowBlock, write_and_read) { std::vector fields; { // k1: bigint { FieldInfo info; info.name = "k1"; info.type = OLAP_FIELD_TYPE_BIGINT; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 8; info.is_key = true; fields.push_back(info); } // k2: char { FieldInfo info; info.name = "k2"; info.type = OLAP_FIELD_TYPE_CHAR; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 10; info.is_key = true; fields.push_back(info); } // k3: varchar { FieldInfo info; info.name = "k3"; info.type = OLAP_FIELD_TYPE_VARCHAR; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 20; info.is_key = true; fields.push_back(info); } } // RowBlock block(fields); RowBlockInfo block_info; block_info.row_num = 1024; block_info.data_file_type = COLUMN_ORIENTED_FILE; block_info.null_supported = true; auto res = block.init(block_info); ASSERT_EQ(OLAP_SUCCESS, res); RowCursor row; row.init(fields); for (int i = 0; i < 5; ++i) { block.get_row(i, &row); // bigint { int64_t val = i; row.set_not_null(0); row.set_field_content(0, (const char*)&val, block.mem_pool()); } // char { char buf[10]; memset(buf, 'a' + i, 10); Slice val(buf, 10); row.set_not_null(1); row.set_field_content(1, (const char*)&val, block.mem_pool()); } // varchar { char buf[10]; memset(buf, '0' + i, 10); Slice val(buf, 10); row.set_not_null(2); row.set_field_content(2, (const char*)&val, block.mem_pool()); } } block.finalize(5); ASSERT_EQ(5, block.row_num()); char serialized_buf[2048]; size_t written_len = 0; res = block.serialize_to_row_format(serialized_buf, 2048, &written_len, OLAP_COMP_STORAGE); ASSERT_EQ(OLAP_SUCCESS, res); { RowBlock resolve_block(fields); block_info.checksum = block.row_block_info().checksum; block_info.row_num = 5; res = resolve_block.init(block_info); ASSERT_EQ(OLAP_SUCCESS, res); res = resolve_block.decompress(serialized_buf, written_len, OLAP_COMP_STORAGE); ASSERT_EQ(OLAP_SUCCESS, res); ASSERT_EQ(5, resolve_block.row_num()); for (int i = 0; i < 5; ++i) { resolve_block.get_row(i, &row); { ASSERT_FALSE(row.is_null(0)); ASSERT_EQ(i, *(int64_t*)row.get_field_content_ptr(0)); } { ASSERT_FALSE(row.is_null(1)); Slice* slice = (Slice*)row.get_field_content_ptr(1); char buf[10]; memset(buf, 'a' + i, 10); ASSERT_EQ(10, slice->size); ASSERT_EQ(0, memcmp(buf, slice->data, 10)); } { ASSERT_FALSE(row.is_null(2)); Slice* slice = (Slice*)row.get_field_content_ptr(2); char buf[20]; memset(buf, '0' + i, 10); ASSERT_EQ(10, slice->size); ASSERT_EQ(0, memcmp(buf, slice->data, 10)); } } } } TEST_F(TestRowBlock, write_and_read_without_nullbyte) { std::vector fields; { // k1: bigint { FieldInfo info; info.name = "k1"; info.type = OLAP_FIELD_TYPE_BIGINT; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 8; info.is_key = true; fields.push_back(info); } // k2: char { FieldInfo info; info.name = "k2"; info.type = OLAP_FIELD_TYPE_CHAR; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 10; info.is_key = true; fields.push_back(info); } // k3: varchar { FieldInfo info; info.name = "k3"; info.type = OLAP_FIELD_TYPE_VARCHAR; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 20; info.is_key = true; fields.push_back(info); } } // RowBlock block(fields); RowBlockInfo block_info; block_info.row_num = 1024; block_info.data_file_type = COLUMN_ORIENTED_FILE; block_info.null_supported = false; auto res = block.init(block_info); ASSERT_EQ(OLAP_SUCCESS, res); RowCursor row; row.init(fields); for (int i = 0; i < 5; ++i) { block.get_row(i, &row); // bigint { int64_t val = i; row.set_not_null(0); row.set_field_content(0, (const char*)&val, block.mem_pool()); } // char { char buf[10]; memset(buf, 'a' + i, 10); Slice val(buf, 10); row.set_not_null(1); row.set_field_content(1, (const char*)&val, block.mem_pool()); } // varchar { char buf[10]; memset(buf, '0' + i, 10); Slice val(buf, 10); row.set_not_null(2); row.set_field_content(2, (const char*)&val, block.mem_pool()); } } block.finalize(5); ASSERT_EQ(5, block.row_num()); char serialized_buf[2048]; size_t written_len = 0; res = block.serialize_to_row_format(serialized_buf, 2048, &written_len, OLAP_COMP_STORAGE); ASSERT_EQ(OLAP_SUCCESS, res); { RowBlock resolve_block(fields); block_info.checksum = block.row_block_info().checksum; block_info.row_num = 5; res = resolve_block.init(block_info); ASSERT_EQ(OLAP_SUCCESS, res); res = resolve_block.decompress(serialized_buf, written_len, OLAP_COMP_STORAGE); ASSERT_EQ(OLAP_SUCCESS, res); ASSERT_EQ(5, resolve_block.row_num()); for (int i = 0; i < 5; ++i) { resolve_block.get_row(i, &row); { ASSERT_FALSE(row.is_null(0)); ASSERT_EQ(i, *(int64_t*)row.get_field_content_ptr(0)); } { ASSERT_FALSE(row.is_null(1)); Slice* slice = (Slice*)row.get_field_content_ptr(1); char buf[10]; memset(buf, 'a' + i, 10); ASSERT_EQ(10, slice->size); ASSERT_EQ(0, memcmp(buf, slice->data, 10)); } { ASSERT_FALSE(row.is_null(2)); Slice* slice = (Slice*)row.get_field_content_ptr(2); char buf[20]; memset(buf, '0' + i, 10); ASSERT_EQ(10, slice->size); ASSERT_EQ(0, memcmp(buf, slice->data, 10)); } } } } TEST_F(TestRowBlock, compress_failed) { std::vector fields; { // k1: bigint { FieldInfo info; info.name = "k1"; info.type = OLAP_FIELD_TYPE_BIGINT; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 8; info.is_key = true; fields.push_back(info); } // k2: char { FieldInfo info; info.name = "k2"; info.type = OLAP_FIELD_TYPE_CHAR; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 10; info.is_key = true; fields.push_back(info); } // k3: varchar { FieldInfo info; info.name = "k3"; info.type = OLAP_FIELD_TYPE_VARCHAR; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 20; info.is_key = true; fields.push_back(info); } } // RowBlock block(fields); RowBlockInfo block_info; block_info.row_num = 1024; block_info.data_file_type = COLUMN_ORIENTED_FILE; block_info.null_supported = true; auto res = block.init(block_info); ASSERT_EQ(OLAP_SUCCESS, res); RowCursor row; row.init(fields); for (int i = 0; i < 5; ++i) { block.get_row(i, &row); // bigint { int64_t val = i; row.set_field_content(0, (const char*)&val, block.mem_pool()); } // char { char buf[10]; memset(buf, 'a' + i, 10); Slice val(buf, 10); row.set_field_content(1, (const char*)&val, block.mem_pool()); } // varchar { char buf[10]; memset(buf, '0' + i, 10); Slice val(buf, 10); row.set_field_content(2, (const char*)&val, block.mem_pool()); } } block.finalize(5); ASSERT_EQ(5, block.row_num()); char serialized_buf[2048]; size_t written_len = 0; res = block.serialize_to_row_format(serialized_buf, 1, &written_len, OLAP_COMP_STORAGE); ASSERT_NE(OLAP_SUCCESS, res); } TEST_F(TestRowBlock, decompress_failed) { std::vector fields; { // k1: bigint { FieldInfo info; info.name = "k1"; info.type = OLAP_FIELD_TYPE_BIGINT; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 8; info.is_key = true; fields.push_back(info); } // k2: char { FieldInfo info; info.name = "k2"; info.type = OLAP_FIELD_TYPE_CHAR; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 10; info.is_key = true; fields.push_back(info); } // k3: varchar { FieldInfo info; info.name = "k3"; info.type = OLAP_FIELD_TYPE_VARCHAR; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 20; info.is_key = true; fields.push_back(info); } } // RowBlock block(fields); RowBlockInfo block_info; block_info.row_num = 1024; block_info.data_file_type = COLUMN_ORIENTED_FILE; block_info.null_supported = true; auto res = block.init(block_info); ASSERT_EQ(OLAP_SUCCESS, res); RowCursor row; row.init(fields); for (int i = 0; i < 5; ++i) { block.get_row(i, &row); // bigint { int64_t val = i; row.set_field_content(0, (const char*)&val, block.mem_pool()); } // char { char buf[10]; memset(buf, 'a' + i, 10); Slice val(buf, 10); row.set_field_content(1, (const char*)&val, block.mem_pool()); } // varchar { char buf[10]; memset(buf, '0' + i, 10); Slice val(buf, 10); row.set_field_content(2, (const char*)&val, block.mem_pool()); } } block.finalize(5); ASSERT_EQ(5, block.row_num()); char serialized_buf[2048]; size_t written_len = 0; res = block.serialize_to_row_format(serialized_buf, 2048, &written_len, OLAP_COMP_STORAGE); ASSERT_EQ(OLAP_SUCCESS, res); { // checksum failed RowBlock resolve_block(fields); block_info.checksum = 0; block_info.row_num = 5; res = resolve_block.init(block_info); ASSERT_EQ(OLAP_SUCCESS, res); res = resolve_block.decompress(serialized_buf, written_len, OLAP_COMP_STORAGE); ASSERT_NE(OLAP_SUCCESS, res); } { // buffer is not ok RowBlock resolve_block(fields); block_info.checksum = block.row_block_info().checksum; block_info.row_num = 5; res = resolve_block.init(block_info); ASSERT_EQ(OLAP_SUCCESS, res); res = resolve_block.decompress(serialized_buf, written_len - 1, OLAP_COMP_STORAGE); ASSERT_NE(OLAP_SUCCESS, res); } } TEST_F(TestRowBlock, find_row) { std::vector fields; { // k1: bigint { FieldInfo info; info.name = "k1"; info.type = OLAP_FIELD_TYPE_BIGINT; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 8; info.is_key = true; fields.push_back(info); } // k2: char { FieldInfo info; info.name = "k2"; info.type = OLAP_FIELD_TYPE_CHAR; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 10; info.is_key = true; fields.push_back(info); } // k3: varchar { FieldInfo info; info.name = "k3"; info.type = OLAP_FIELD_TYPE_VARCHAR; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 20; info.is_key = true; fields.push_back(info); } } // RowBlock block(fields); RowBlockInfo block_info; block_info.row_num = 1024; block_info.data_file_type = COLUMN_ORIENTED_FILE; block_info.null_supported = true; auto res = block.init(block_info); ASSERT_EQ(OLAP_SUCCESS, res); RowCursor row; row.init(fields); for (int i = 0; i < 5; ++i) { block.get_row(i, &row); // bigint { int64_t val = i; row.set_not_null(0); row.set_field_content(0, (const char*)&val, block.mem_pool()); } // char { char buf[10]; memset(buf, 'a' + i, 10); Slice val(buf, 10); row.set_not_null(1); row.set_field_content(1, (const char*)&val, block.mem_pool()); } // varchar { char buf[10]; memset(buf, '0' + i, 10); Slice val(buf, 10); row.set_not_null(2); row.set_field_content(2, (const char*)&val, block.mem_pool()); } } block.finalize(5); ASSERT_EQ(5, block.row_num()); { RowCursor find_row; find_row.init(fields); for (int i = 0; i < 5; ++i) { // bigint { int64_t val = i; find_row.set_not_null(0); find_row.set_field_content(0, (const char*)&val, block.mem_pool()); } // char { char buf[10]; memset(buf, 'a' + i, 10); Slice val(buf, 10); find_row.set_not_null(1); find_row.set_field_content(1, (const char*)&val, block.mem_pool()); } // varchar { char buf[10]; memset(buf, '0' + i, 10); Slice val(buf, 10); find_row.set_not_null(2); find_row.set_field_content(2, (const char*)&val, block.mem_pool()); } uint32_t row_index; res = block.find_row(find_row, false, &row_index); ASSERT_EQ(OLAP_SUCCESS, res); ASSERT_EQ(i, row_index); res = block.find_row(find_row, true, &row_index); ASSERT_EQ(OLAP_SUCCESS, res); ASSERT_EQ(i + 1, row_index); } { // bigint { int64_t val = 1; find_row.set_field_content(0, (const char*)&val, block.mem_pool()); } // char { char buf[10]; memset(buf, 'c', 9); Slice val(buf, 9); find_row.set_field_content(1, (const char*)&val, block.mem_pool()); } // varchar { char buf[10]; memset(buf, '0', 10); Slice val(buf, 10); find_row.set_field_content(2, (const char*)&val, block.mem_pool()); } uint32_t row_index; res = block.find_row(find_row, true, &row_index); ASSERT_EQ(OLAP_SUCCESS, res); ASSERT_EQ(2, row_index); } { // bigint { int64_t val = -1; find_row.set_field_content(0, (const char*)&val, block.mem_pool()); } // char { char buf[10]; memset(buf, 'c', 9); Slice val(buf, 9); find_row.set_field_content(1, (const char*)&val, block.mem_pool()); } // varchar { char buf[10]; memset(buf, '0', 10); Slice val(buf, 10); find_row.set_field_content(2, (const char*)&val, block.mem_pool()); } uint32_t row_index; res = block.find_row(find_row, true, &row_index); ASSERT_EQ(OLAP_SUCCESS, res); ASSERT_EQ(0, row_index); } } } TEST_F(TestRowBlock, clear) { std::vector fields; { // k1: bigint { FieldInfo info; info.name = "k1"; info.type = OLAP_FIELD_TYPE_BIGINT; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 8; info.is_key = true; fields.push_back(info); } // k2: char { FieldInfo info; info.name = "k2"; info.type = OLAP_FIELD_TYPE_CHAR; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 10; info.is_key = true; fields.push_back(info); } // k3: varchar { FieldInfo info; info.name = "k3"; info.type = OLAP_FIELD_TYPE_VARCHAR; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 20; info.is_key = true; fields.push_back(info); } } // RowBlock block(fields); RowBlockInfo block_info; block_info.row_num = 1024; block_info.data_file_type = COLUMN_ORIENTED_FILE; block_info.null_supported = true; auto res = block.init(block_info); ASSERT_EQ(OLAP_SUCCESS, res); block.finalize(5); ASSERT_EQ(5, block.row_num()); ASSERT_EQ(1024, block.capacity()); block.clear(); ASSERT_EQ(1024, block.row_num()); } TEST_F(TestRowBlock, pos_limit) { std::vector fields; { // k1: bigint { FieldInfo info; info.name = "k1"; info.type = OLAP_FIELD_TYPE_BIGINT; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 8; info.is_key = true; fields.push_back(info); } // k2: char { FieldInfo info; info.name = "k2"; info.type = OLAP_FIELD_TYPE_CHAR; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 10; info.is_key = true; fields.push_back(info); } // k3: varchar { FieldInfo info; info.name = "k3"; info.type = OLAP_FIELD_TYPE_VARCHAR; info.aggregation = OLAP_FIELD_AGGREGATION_NONE; info.length = 20; info.is_key = true; fields.push_back(info); } } // RowBlock block(fields); RowBlockInfo block_info; block_info.row_num = 1024; block_info.data_file_type = COLUMN_ORIENTED_FILE; block_info.null_supported = true; auto res = block.init(block_info); ASSERT_EQ(OLAP_SUCCESS, res); // assert init value ASSERT_EQ(0, block.pos()); ASSERT_EQ(0, block.limit()); ASSERT_FALSE(block.has_remaining()); ASSERT_EQ(DEL_PARTIAL_SATISFIED, block.block_status()); block.set_limit(100); ASSERT_EQ(100, block.limit()); ASSERT_TRUE(block.has_remaining()); ASSERT_EQ(100, block.remaining()); block.set_pos(2); ASSERT_TRUE(block.has_remaining()); ASSERT_EQ(98, block.remaining()); block.pos_inc(); ASSERT_TRUE(block.has_remaining()); ASSERT_EQ(97, block.remaining()); block.set_block_status(DEL_SATISFIED); ASSERT_EQ(DEL_SATISFIED, block.block_status()); } } // @brief Test Stub int main(int argc, char** argv) { std::string conffile = std::string(getenv("DORIS_HOME")) + "/conf/be.conf"; if (!doris::config::init(conffile.c_str(), false)) { fprintf(stderr, "error read config file. \n"); return -1; } doris::init_glog("be-test"); int ret = doris::OLAP_SUCCESS; testing::InitGoogleTest(&argc, argv); ret = RUN_ALL_TESTS(); return ret; }