 566e920620
			
		
	
	566e920620
	
	
	
		
			
			Co-authored-by: wangt1xiuyi <13547954130@163.com> Co-authored-by: yangqise7en <877793735@qq.com> Co-authored-by: Zach41 <zach_41@163.com>
		
			
				
	
	
		
			392 lines
		
	
	
		
			14 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			392 lines
		
	
	
		
			14 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| /**
 | |
|  * Copyright (c) 2022 OceanBase
 | |
|  * OceanBase is licensed under Mulan PubL v2.
 | |
|  * You can use this software according to the terms and conditions of the Mulan PubL v2.
 | |
|  * You may obtain a copy of Mulan PubL v2 at:
 | |
|  *          http://license.coscl.org.cn/MulanPubL-2.0
 | |
|  * THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
 | |
|  * EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
 | |
|  * MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
 | |
|  * See the Mulan PubL v2 for more details.
 | |
|  */
 | |
| 
 | |
| #define USING_LOG_PREFIX STORAGE
 | |
| 
 | |
| #include <gtest/gtest.h>
 | |
| #define protected public
 | |
| #define private public
 | |
| #include "lib/string/ob_sql_string.h"
 | |
| #include "storage/blocksstable/index_block/ob_index_block_aggregator.h"
 | |
| #include "ob_row_generate.h"
 | |
| 
 | |
| 
 | |
| namespace oceanbase
 | |
| {
 | |
| namespace blocksstable
 | |
| {
 | |
| using namespace common;
 | |
| using namespace storage;
 | |
| using namespace share::schema;
 | |
| 
 | |
| class TestIndexBlockAggregator : public ::testing::Test
 | |
| {
 | |
| public:
 | |
|   TestIndexBlockAggregator() {}
 | |
|   virtual ~TestIndexBlockAggregator() {}
 | |
|   virtual void SetUp() {}
 | |
|   virtual void TearDown() {}
 | |
|   void init_schema(const int64_t col_count, const ObObjType *col_obj_types);
 | |
|   void init_skip_index_meta(const int64_t idx_col_count, const int64_t *min_max_col_idxs);
 | |
| 
 | |
|   void generate_row_by_seed(const int64_t seed, ObDatumRow &datum_row);
 | |
|   void reset_min_max_row();
 | |
|   void update_min_max_row(const ObDatumRow &row);
 | |
|   void validate_agg_row(const ObDatumRow &row, int64_t nop_col_cnt = 0, int64_t *nop_col_idxs = nullptr);
 | |
|   void set_nop_cols(ObDatumRow &row, int64_t nop_col_cnt = 0, int64_t *nop_col_idxs = nullptr);
 | |
|   bool is_col_in_nop_col_arr(const int64_t col_idx, const int64_t nop_col_cnt, int64_t *nop_col_idxs);
 | |
|   void serialize_agg_row(const ObDatumRow &agg_row, const char *&row_buf, int64_t &row_size);
 | |
|   void get_cmp_func(const ObColDesc &col_desc, ObStorageDatumCmpFunc &cmp_func);
 | |
| 
 | |
| private:
 | |
|   ObArenaAllocator allocator_;
 | |
|   ObRowGenerate row_generate_;
 | |
|   ObArray<ObColDesc> col_descs_;
 | |
|   ObArray<ObSkipIndexColMeta> full_agg_metas_;
 | |
|   ObTableSchema schema_;
 | |
|   const ObObjType *col_obj_types_;
 | |
|   int64_t col_count_;
 | |
|   int64_t rowkey_count_;
 | |
|   int64_t full_column_count_;
 | |
|   ObDatumRow max_row_;
 | |
|   ObDatumRow min_row_;
 | |
|   int64_t *null_count_arr_;
 | |
|   ObAggRowWriter agg_row_writer_;
 | |
| };
 | |
| 
 | |
| void TestIndexBlockAggregator::init_schema(const int64_t col_count, const ObObjType *col_obj_types)
 | |
| {
 | |
|   col_count_ = col_count;
 | |
|   rowkey_count_ = 1;
 | |
|   col_obj_types_ = col_obj_types;
 | |
|   ObColumnSchemaV2 col;
 | |
|   schema_.reset();
 | |
|   schema_.set_tenant_id(1);
 | |
|   schema_.set_tablegroup_id(1);
 | |
|   schema_.set_database_id(1);
 | |
|   schema_.set_table_id(200001);
 | |
|   schema_.set_table_name("test_index_aggregator_schema");
 | |
|   schema_.set_rowkey_column_num(rowkey_count_);
 | |
|   schema_.set_max_column_id(col_count_ * 2);
 | |
|   schema_.set_block_size(2 * 1024);
 | |
| 
 | |
|   ObSqlString str;
 | |
|   for (int64_t i = 0; i < col_count_; ++i) {
 | |
|     col.reset();
 | |
|     col.set_table_id(200001);
 | |
|     col.set_column_id(i + OB_APP_MIN_COLUMN_ID);
 | |
|     str.assign_fmt("test%ld", i);
 | |
|     col.set_column_name(str.ptr());
 | |
|     ObObjType type = col_obj_types_[i];
 | |
|     col.set_data_type(type);
 | |
|     if (ob_is_string_tc(type)) {
 | |
|       col.set_collation_type(CS_TYPE_UTF8MB4_GENERAL_CI);
 | |
|     } else {
 | |
|       col.set_collation_type(CS_TYPE_BINARY);
 | |
|     }
 | |
| 
 | |
|     if (0 == i) {
 | |
|       col.set_rowkey_position(1);
 | |
|     }
 | |
|     ASSERT_EQ(OB_SUCCESS, schema_.add_column(col));
 | |
|   }
 | |
|   ASSERT_EQ(OB_SUCCESS, row_generate_.init(schema_, true/*multi_version*/));
 | |
|   ASSERT_EQ(OB_SUCCESS, schema_.get_multi_version_column_descs(col_descs_));
 | |
|   full_column_count_ = col_descs_.count();
 | |
| }
 | |
| 
 | |
| void TestIndexBlockAggregator::init_skip_index_meta(
 | |
|     const int64_t idx_col_count, const int64_t *min_max_col_idxs)
 | |
| {
 | |
|   for (int64_t i = 0; i < idx_col_count; ++i) {
 | |
|     ObSkipIndexColMeta meta;
 | |
|     ObSkipIndexColMeta max;
 | |
|     ObSkipIndexColMeta null_count;
 | |
|     meta.col_idx_ = min_max_col_idxs[i];
 | |
|     meta.col_type_ = SK_IDX_MIN;
 | |
|     ASSERT_EQ(OB_SUCCESS, full_agg_metas_.push_back(meta));
 | |
|     meta.col_type_ = SK_IDX_MAX;
 | |
|     ASSERT_EQ(OB_SUCCESS, full_agg_metas_.push_back(meta));
 | |
|     meta.col_type_ = SK_IDX_NULL_COUNT;
 | |
|     ASSERT_EQ(OB_SUCCESS, full_agg_metas_.push_back(meta));
 | |
|   }
 | |
| }
 | |
| 
 | |
| void TestIndexBlockAggregator::generate_row_by_seed(const int64_t seed, ObDatumRow &datum_row)
 | |
| {
 | |
|   // if (0 == seed) {
 | |
|   if (false) {
 | |
|     for (int64_t i = 0; i < datum_row.get_column_count(); ++i) {
 | |
|       datum_row.storage_datums_[i].set_null();
 | |
|     }
 | |
|   } else {
 | |
|     ASSERT_EQ(OB_SUCCESS, row_generate_.get_next_row(seed, datum_row));
 | |
|   }
 | |
| }
 | |
| 
 | |
| void TestIndexBlockAggregator::reset_min_max_row()
 | |
| {
 | |
|   const int64_t agg_col_cnt = full_agg_metas_.count();
 | |
|   min_row_.reset();
 | |
|   max_row_.reset();
 | |
|   if (nullptr != null_count_arr_) {
 | |
|     allocator_.free(null_count_arr_);
 | |
|   }
 | |
|   ASSERT_EQ(OB_SUCCESS, min_row_.init(agg_col_cnt));
 | |
|   ASSERT_EQ(OB_SUCCESS, max_row_.init(agg_col_cnt));
 | |
|   for (int64_t i = 0; i < agg_col_cnt; ++i) {
 | |
|     min_row_.storage_datums_[i].set_max();
 | |
|     max_row_.storage_datums_[i].set_min();
 | |
|   }
 | |
|   null_count_arr_ = reinterpret_cast<int64_t *>(allocator_.alloc(sizeof(int64_t) * agg_col_cnt));
 | |
|   memset(null_count_arr_, 0, sizeof(int64_t) * agg_col_cnt);
 | |
| }
 | |
| 
 | |
| void TestIndexBlockAggregator::update_min_max_row(const ObDatumRow &row)
 | |
| {
 | |
|   for (int64_t i = 0; i < row.get_column_count(); ++i) {
 | |
|     const ObStorageDatum &curr_datum = row.storage_datums_[i];
 | |
|     if (!curr_datum.is_null()) {
 | |
|       ObStorageDatum &min_datum = min_row_.storage_datums_[i];
 | |
|       ObStorageDatum &max_datum = max_row_.storage_datums_[i];
 | |
|       int min_cmp_ret = 0;
 | |
|       int max_cmp_ret = 0;
 | |
|       ObStorageDatumCmpFunc cmp_func;
 | |
|       get_cmp_func(col_descs_.at(i), cmp_func);
 | |
|       ASSERT_EQ(OB_SUCCESS, cmp_func.compare(curr_datum, min_datum, min_cmp_ret));
 | |
|       ASSERT_EQ(OB_SUCCESS, cmp_func.compare(curr_datum, max_datum, max_cmp_ret));
 | |
|       if (min_cmp_ret < 0) {
 | |
|         min_datum.deep_copy(curr_datum, allocator_);
 | |
|         if (min_datum.len_ > ObSkipIndexColMeta::MAX_SKIP_INDEX_COL_LENGTH) {
 | |
|           min_datum.len_ = ObSkipIndexColMeta::MAX_SKIP_INDEX_COL_LENGTH;
 | |
|         }
 | |
|       }
 | |
|       if (max_cmp_ret > 0) {
 | |
|         max_datum.deep_copy(curr_datum, allocator_);
 | |
|         if (max_datum.len_ > ObSkipIndexColMeta::MAX_SKIP_INDEX_COL_LENGTH) {
 | |
|           max_datum.len_ = ObSkipIndexColMeta::MAX_SKIP_INDEX_COL_LENGTH;
 | |
|         }
 | |
|       }
 | |
|     } else {
 | |
|       null_count_arr_[i]++;
 | |
|     }
 | |
|   }
 | |
| }
 | |
| 
 | |
| void TestIndexBlockAggregator::validate_agg_row(
 | |
|     const ObDatumRow &datum_row, int64_t nop_col_cnt, int64_t *nop_col_idxs)
 | |
| {
 | |
|   for (int64_t i = 0; i < full_agg_metas_.count(); ++i) {
 | |
|     ObSkipIndexColMeta idx_meta = full_agg_metas_.at(i);
 | |
|     const int64_t col_idx = idx_meta.col_idx_;
 | |
|     bool is_nop_column = is_col_in_nop_col_arr(col_idx, nop_col_cnt, nop_col_idxs);
 | |
|     if (is_nop_column) {
 | |
|       ASSERT_TRUE(datum_row.storage_datums_[i].is_nop());
 | |
|     } else {
 | |
|       ObStorageDatumCmpFunc cmp_func;
 | |
|       get_cmp_func(col_descs_.at(col_idx), cmp_func);
 | |
|       int cmp_ret = 0;
 | |
|       switch (idx_meta.col_type_) {
 | |
|       case SK_IDX_MIN: {
 | |
|         ASSERT_EQ(OB_SUCCESS, cmp_func.compare(
 | |
|             min_row_.storage_datums_[col_idx], datum_row.storage_datums_[i], cmp_ret));
 | |
|         ASSERT_EQ(0, cmp_ret);
 | |
|         break;
 | |
|       }
 | |
|       case SK_IDX_MAX: {
 | |
|         ASSERT_EQ(OB_SUCCESS, cmp_func.compare(
 | |
|             max_row_.storage_datums_[col_idx], datum_row.storage_datums_[i], cmp_ret));
 | |
|         ASSERT_EQ(0, cmp_ret);
 | |
|         break;
 | |
|       }
 | |
|       case SK_IDX_NULL_COUNT: {
 | |
|         ASSERT_EQ(null_count_arr_[col_idx], datum_row.storage_datums_[i].get_int());
 | |
|         break;
 | |
|       }
 | |
|       default:
 | |
|         // ERROR
 | |
|         ASSERT_TRUE(false);
 | |
|       }
 | |
|     }
 | |
|   }
 | |
| }
 | |
| 
 | |
| void TestIndexBlockAggregator::set_nop_cols(
 | |
|     ObDatumRow &row, int64_t nop_col_cnt, int64_t *nop_col_idxs)
 | |
| {
 | |
|   for (int64_t i = 0; i < full_agg_metas_.count(); ++i) {
 | |
|     ASSERT_TRUE(i < row.get_column_count());
 | |
|     ObSkipIndexColMeta idx_meta = full_agg_metas_.at(i);
 | |
|     const int64_t col_idx = idx_meta.col_idx_;
 | |
|     if (is_col_in_nop_col_arr(col_idx, nop_col_cnt, nop_col_idxs)) {
 | |
|       row.storage_datums_[i].set_nop();
 | |
|     }
 | |
|   }
 | |
| }
 | |
| 
 | |
| bool TestIndexBlockAggregator::is_col_in_nop_col_arr(
 | |
|     const int64_t col_idx, const int64_t nop_col_cnt, int64_t *nop_col_idxs)
 | |
| {
 | |
|   bool is_nop_column = false;
 | |
|   for (int64_t i = 0; i < nop_col_cnt; ++i) {
 | |
|     if (col_idx == nop_col_idxs[i]) {
 | |
|       is_nop_column = true;
 | |
|       break;
 | |
|     }
 | |
|   }
 | |
|   return is_nop_column;
 | |
| }
 | |
| 
 | |
| void TestIndexBlockAggregator::serialize_agg_row(
 | |
|     const ObDatumRow &agg_row, const char *&row_buf, int64_t &row_size)
 | |
| {
 | |
|   agg_row_writer_.reset();
 | |
|   char *buf = nullptr;
 | |
|   int64_t size = 0;
 | |
|   int64_t pos = 0;
 | |
|   ASSERT_EQ(OB_SUCCESS, agg_row_writer_.init(full_agg_metas_, agg_row, allocator_));
 | |
|   size = agg_row_writer_.get_data_size();
 | |
|   buf = static_cast<char *>(allocator_.alloc(size));
 | |
|   ASSERT_TRUE(nullptr != buf);
 | |
|   ASSERT_EQ(OB_SUCCESS, agg_row_writer_.write_agg_data(buf, size, pos));
 | |
|   row_buf = buf;
 | |
|   row_size = pos;
 | |
| }
 | |
| 
 | |
| void TestIndexBlockAggregator::get_cmp_func(const ObColDesc &col_desc, ObStorageDatumCmpFunc &cmp_func)
 | |
| {
 | |
|   sql::ObExprBasicFuncs *basic_funcs = ObDatumFuncs::get_basic_func(
 | |
|       col_desc.col_type_.get_type(), col_desc.col_type_.get_collation_type());
 | |
|   cmp_func.cmp_func_.cmp_func_ = lib::is_oracle_mode() ? basic_funcs->null_last_cmp_ : basic_funcs->null_first_cmp_;
 | |
| }
 | |
| 
 | |
| TEST_F(TestIndexBlockAggregator, basic_aggregate)
 | |
| {
 | |
|   const int64_t test_column_cnt = 24;
 | |
|   const int64_t test_row_cnt = 10;
 | |
|   const int64_t extra_rowkey_cnt = ObMultiVersionRowkeyHelpper::get_extra_rowkey_col_cnt();
 | |
|   ObObjType col_obj_types[24];
 | |
|   int64_t min_max_agg_col_idxs[24];
 | |
|   for (int64_t i = 0; i < test_column_cnt; ++i) {
 | |
|     col_obj_types[i] = static_cast<ObObjType>(i + 1);
 | |
|     const int64_t agg_col_idx = i < rowkey_count_ ? i : i + extra_rowkey_cnt;
 | |
|     min_max_agg_col_idxs[i] = agg_col_idx;
 | |
|   }
 | |
|   init_schema(test_column_cnt, col_obj_types);
 | |
|   init_skip_index_meta(test_column_cnt, min_max_agg_col_idxs);
 | |
| 
 | |
|   ObSkipIndexAggregator data_aggregator;
 | |
|   ObSkipIndexAggregator index_aggregator;
 | |
|   ObDatumRow data_agg_result;
 | |
|   ObDatumRow index_agg_result;
 | |
|   ASSERT_EQ(OB_SUCCESS, data_agg_result.init(full_agg_metas_.count()));
 | |
|   ASSERT_EQ(OB_SUCCESS, index_agg_result.init(full_agg_metas_.count()));
 | |
| 
 | |
|   for (int64_t test_round = 0; test_round < 7; ++test_round) {
 | |
|     reset_min_max_row();
 | |
|     data_agg_result.reuse();
 | |
|     index_agg_result.reuse();
 | |
|     ASSERT_EQ(OB_SUCCESS, data_aggregator.init(full_agg_metas_, col_descs_, true, data_agg_result, allocator_));
 | |
|     ASSERT_EQ(OB_SUCCESS, index_aggregator.init(full_agg_metas_, col_descs_, false, index_agg_result, allocator_));
 | |
| 
 | |
|     const ObDatumRow *data_agg_row = nullptr;
 | |
|     const ObDatumRow *index_agg_row = nullptr;
 | |
|     ObDatumRow generate_row;
 | |
|     ASSERT_EQ(OB_SUCCESS, generate_row.init(full_column_count_));
 | |
|     for (int64_t i = 0; i < test_row_cnt; ++i) {
 | |
|       const int64_t seed = random() % test_row_cnt;
 | |
|       generate_row_by_seed(seed, generate_row);
 | |
|       ASSERT_EQ(OB_SUCCESS, data_aggregator.eval(generate_row));
 | |
|       ASSERT_EQ(OB_SUCCESS, data_aggregator.get_aggregated_row(data_agg_row));
 | |
|       ASSERT_TRUE(nullptr != data_agg_row);
 | |
|       if (0 == test_row_cnt / 2) {
 | |
|         ASSERT_EQ(OB_SUCCESS, index_aggregator.eval(*data_agg_row));
 | |
|       } else {
 | |
|         const char *row_buf = nullptr;
 | |
|         int64_t row_size = 0;
 | |
|         serialize_agg_row(*data_agg_row, row_buf, row_size);
 | |
|         ASSERT_TRUE(nullptr != row_buf);
 | |
|         ASSERT_EQ(OB_SUCCESS, index_aggregator.eval(row_buf, row_size));
 | |
|       }
 | |
|       ASSERT_EQ(OB_SUCCESS, index_aggregator.get_aggregated_row(index_agg_row));
 | |
|       ASSERT_TRUE(nullptr != index_agg_row);
 | |
|       update_min_max_row(generate_row);
 | |
|       validate_agg_row(*data_agg_row);
 | |
|       validate_agg_row(*index_agg_row);
 | |
|     }
 | |
|     data_aggregator.reset();
 | |
|     index_aggregator.reset();
 | |
|   }
 | |
| 
 | |
|   // test nop agg
 | |
|   const int64_t nop_col_cnt = 3;
 | |
|   int64_t nop_col_idxs[nop_col_cnt] = {10, 13, 15};
 | |
|   reset_min_max_row();
 | |
|   data_agg_result.reuse();
 | |
|   index_agg_result.reuse();
 | |
|   ASSERT_EQ(OB_SUCCESS, data_aggregator.init(full_agg_metas_, col_descs_, true, data_agg_result, allocator_));
 | |
|   ASSERT_EQ(OB_SUCCESS, index_aggregator.init(full_agg_metas_, col_descs_, false, index_agg_result, allocator_));
 | |
|   const ObDatumRow *data_agg_row = nullptr;
 | |
|   const ObDatumRow *index_agg_row = nullptr;
 | |
|   ObDatumRow generate_row;
 | |
|   ASSERT_EQ(OB_SUCCESS, generate_row.init(full_column_count_));
 | |
|   for (int64_t i = 0; i < test_row_cnt; ++i) {
 | |
|     const int64_t seed = random() % test_row_cnt;
 | |
|     generate_row_by_seed(seed, generate_row);
 | |
|     ASSERT_EQ(OB_SUCCESS, data_aggregator.eval(generate_row));
 | |
|     ASSERT_EQ(OB_SUCCESS, data_aggregator.get_aggregated_row(data_agg_row));
 | |
|     ASSERT_TRUE(nullptr != data_agg_row);
 | |
|     set_nop_cols(*const_cast<ObDatumRow *>(data_agg_row), nop_col_cnt, nop_col_idxs);
 | |
|     ASSERT_EQ(OB_SUCCESS, index_aggregator.eval(*data_agg_row));
 | |
|     ASSERT_EQ(OB_SUCCESS, index_aggregator.get_aggregated_row(index_agg_row));
 | |
|     ASSERT_TRUE(nullptr != index_agg_row);
 | |
|     update_min_max_row(generate_row);
 | |
|     validate_agg_row(*data_agg_row, nop_col_cnt, nop_col_idxs);
 | |
|     validate_agg_row(*index_agg_row, nop_col_cnt, nop_col_idxs);
 | |
|   }
 | |
| 
 | |
|   // test reuse
 | |
|   reset_min_max_row();
 | |
|   data_agg_result.reuse();
 | |
|   index_agg_result.reuse();
 | |
|   data_aggregator.reuse();
 | |
|   index_aggregator.reuse();
 | |
|   data_agg_row = nullptr;
 | |
|   index_agg_row = nullptr;
 | |
|   for (int64_t i = 0; i < test_row_cnt; ++i) {
 | |
|     const int64_t seed = random() % test_row_cnt;
 | |
|     generate_row_by_seed(seed, generate_row);
 | |
|     ASSERT_EQ(OB_SUCCESS, data_aggregator.eval(generate_row));
 | |
|     ASSERT_EQ(OB_SUCCESS, data_aggregator.get_aggregated_row(data_agg_row));
 | |
|     ASSERT_TRUE(nullptr != data_agg_row);
 | |
|     set_nop_cols(*const_cast<ObDatumRow *>(data_agg_row), 0, nullptr);
 | |
|     ASSERT_EQ(OB_SUCCESS, index_aggregator.eval(*data_agg_row));
 | |
|     ASSERT_EQ(OB_SUCCESS, index_aggregator.get_aggregated_row(index_agg_row));
 | |
|     ASSERT_TRUE(nullptr != index_agg_row);
 | |
|     update_min_max_row(generate_row);
 | |
|     validate_agg_row(*data_agg_row, 0, nullptr);
 | |
|     validate_agg_row(*index_agg_row, 0, nullptr);
 | |
|   }
 | |
| 
 | |
| }
 | |
| 
 | |
| }
 | |
| }
 | |
| 
 | |
| int main(int argc, char **argv)
 | |
| {
 | |
|   system("rm -f test_index_block_aggregator.log*");
 | |
|   OB_LOGGER.set_file_name("test_index_block_aggregator.log", true, false);
 | |
|   oceanbase::common::ObLogger::get_logger().set_log_level("INFO");
 | |
|   testing::InitGoogleTest(&argc, argv);
 | |
|   return RUN_ALL_TESTS();
 | |
| } |