oceanbase/unittest/sql/engine/set/test_merge_set_op_vec.cpp
2023-01-28 20:40:16 +08:00

795 lines
29 KiB
C++

/**
* Copyright (c) 2021 OceanBase
* OceanBase CE is licensed under Mulan PubL v2.
* You can use this software according to the terms and conditions of the Mulan PubL v2.
* You may obtain a copy of Mulan PubL v2 at:
* http://license.coscl.org.cn/MulanPubL-2.0
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
* See the Mulan PubL v2 for more details.
*/
#define USING_LOG_PREFIX SQL
#include <gtest/gtest.h>
#define private public
#define protected public
#include "sql/engine/set/ob_merge_union_op.h"
#include "sql/engine/set/ob_merge_intersect_op.h"
#include "sql/engine/set/ob_merge_except_op.h"
#include "sql/engine/aggregate/ob_merge_distinct_op.h"
#include "share/system_variable/ob_system_variable.h"
#include "storage/blocksstable/ob_data_file_prepare.h"
#include "sql/engine/table/ob_fake_table.h"
#include "set_data_op_generator.h"
#include "sql/ob_sql_init.h"
#include "share/ob_cluster_version.h"
#include "observer/omt/ob_tenant_config_mgr.h"
#include "share/datum/ob_datum_funcs.h"
namespace oceanbase
{
namespace sql
{
using namespace common;
using namespace share;
using namespace omt;
ObArenaAllocator allocator_;
ObExecContext exec_ctx_(allocator_);
ObEvalCtx op_eval_ctx_ = ObEvalCtx(exec_ctx_);
class MockSqlExpression : public ObSqlExpression
{
public:
MockSqlExpression(ObIAllocator &alloc): ObSqlExpression(alloc)
{
set_item_count(10);
}
};
#define TEST_SET_DUMP_GET_HASH_AREA_SIZE() (get_hash_area_size())
#define TEST_SET_DUMP_SET_HASH_AREA_SIZE(size) (set_hash_area_size(size))
const int64_t BATCH_SIZE = 256;
class ObMergeSetVecTest:
public blocksstable::TestDataFilePrepare, public ::testing::WithParamInterface<ObJoinType>
{
public:
typedef std::function<int64_t(const int64_t, const int64_t)> IdxCntFunc;
enum TestAlgo
{
UNION = 0,
INTERSECT,
EXCEPT,
DISTINCT
};
protected:
struct SetPlan
{
explicit SetPlan(ObExecContext &exec_ctx, const ObOpSpec &left_spec, const ObOpSpec &right_spec, ObOpInput *input)
: set_op_(nullptr), left_(exec_ctx, left_spec, input, ObString("LEFT_OP")), right_(exec_ctx, right_spec, input, ObString("RIGHT_OP")), expr_(exec_ctx.get_allocator())
{
}
int setup_plan(ObOperator *set_op);
ObSQLSessionInfo session_;
ObPhysicalPlan plan_;
ObOperator *set_op_;
SetDataGeneratorOp left_;
SetDataGeneratorOp right_;
MockSqlExpression expr_;
};
public:
ObMergeSetVecTest()
: blocksstable::TestDataFilePrepare("TestDiskIR", 8<<20, 5000), spec1_(exec_ctx_.get_allocator(), PHY_MERGE_INTERSECT),
spec2_(exec_ctx_.get_allocator(), PHY_MERGE_INTERSECT), spec3_(exec_ctx_.get_allocator(), PHY_MERGE_EXCEPT),
spec4_(exec_ctx_.get_allocator(), PHY_MERGE_EXCEPT), spec5_(exec_ctx_.get_allocator(), PHY_TABLE_SCAN), spec6_(exec_ctx_.get_allocator(), PHY_TABLE_SCAN),
spec7_(exec_ctx_.get_allocator(), PHY_MERGE_UNION), spec8_(exec_ctx_.get_allocator(), PHY_MERGE_UNION),
spec9_(exec_ctx_.get_allocator(), PHY_TABLE_SCAN), spec10_(exec_ctx_.get_allocator(), PHY_TABLE_SCAN),
spec11_(exec_ctx_.get_allocator(), PHY_MERGE_DISTINCT), spec12_(exec_ctx_.get_allocator(), PHY_MERGE_DISTINCT),
merge_intersect_vec_(exec_ctx_, spec1_, nullptr), merge_intersect_(exec_ctx_, spec2_, nullptr),
merge_except_vec_(exec_ctx_, spec3_, nullptr), merge_except_(exec_ctx_, spec4_, nullptr),
merge_union_vec_(exec_ctx_, spec7_, nullptr), merge_union_(exec_ctx_, spec8_, nullptr),
merge_distinct_vec_(exec_ctx_, spec11_, nullptr), merge_distinct_(exec_ctx_, spec12_, nullptr),
merge_set_op_vec_(nullptr), merge_set_op_(nullptr),
merge_plan_vec_(exec_ctx_, spec5_, spec6_, nullptr), merge_plan_(exec_ctx_, spec9_, spec10_, nullptr)
{
spec1_.batch_size_ = BATCH_SIZE;
spec2_.batch_size_ = 0;
spec3_.batch_size_ = BATCH_SIZE;
spec4_.batch_size_ = 0;
spec5_.batch_size_ = BATCH_SIZE;
spec6_.batch_size_ = BATCH_SIZE;
spec7_.batch_size_ = BATCH_SIZE;
spec8_.batch_size_ = 0;
spec9_.batch_size_ = 0;
spec10_.batch_size_ = 0;
spec11_.batch_size_ = BATCH_SIZE;
spec12_.batch_size_ = 0;
}
int init_tenant_mgr();
virtual void SetUp() override
{
ASSERT_EQ(OB_SUCCESS, init_tenant_mgr());
blocksstable::TestDataFilePrepare::SetUp();
ASSERT_EQ(OB_SUCCESS, blocksstable::ObTmpFileManager::get_instance().init());
CHUNK_MGR.set_limit(128L * 1024L * 1024L * 1024L);
GCONF.enable_sql_operator_dump.set_value("True");
uint64_t cluster_version = CLUSTER_VERSION_3000;
common::ObClusterVersion::get_instance().update_cluster_version(cluster_version);
EXPECT_EQ(cluster_version, common::ObClusterVersion::get_instance().get_cluster_version());
LOG_INFO("set cluster version", K(cluster_version),
K(common::ObClusterVersion::get_instance().get_cluster_version()));
}
virtual void TearDown() override
{
blocksstable::ObTmpFileManager::get_instance().destroy();
blocksstable::TestDataFilePrepare::TearDown();
destroy_tenant_mgr();
}
void destroy_tenant_mgr()
{
ObTenantManager::get_instance().destroy();
}
int64_t get_hash_area_size()
{
int64_t hash_area_size = 0;
int ret = OB_SUCCESS;
ret = ObSqlWorkareaUtil::get_workarea_size(HASH_WORK_AREA, OB_SYS_TENANT_ID, hash_area_size);
if (OB_FAIL(ret)) {
LOG_WARN("failed to get hash area size", K(ret), K(hash_area_size));
}
return hash_area_size;
}
void set_hash_area_size(int64_t size)
{
int ret = OB_SUCCESS;
int64_t tenant_id = OB_SYS_TENANT_ID;
ObTenantConfigGuard tenant_config(TENANT_CONF(tenant_id));
if (tenant_config.is_valid()) {
tenant_config->_hash_area_size = size;
} else {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("unexpected status: config is invalid", K(tenant_id));
}
// ASSERT_EQ(OB_SUCCESS, ret);
}
void setup_plan(SetPlan &plan, bool vec_algo, ObMergeSetVecTest::TestAlgo algo);
void setup_test(TestAlgo algo, int32_t string_size,
int64_t left_row_count, bool left_reverse, IdxCntFunc left_func,
int64_t right_row_count, bool right_reverse, IdxCntFunc right_func);
// iterate hash join result and verify result with merge join.
void run_test(int64_t print_row_cnt = 0);
int generate_merge_set_spec(ObMergeSetSpec &spec, bool is_vec)
{
int ret = OB_SUCCESS;
//spec.set_exprs_.set_allocator(&alloc_);
//spec.sort_cmp_funs_.set_allocator(&alloc_);
//spec.sort_collations_.set_allocator(&alloc_);
spec.set_exprs_.destroy();
spec.cost_ = 1;
spec.rows_ = 5000;
spec.width_ = 20;
spec.is_distinct_ = true;
if (OB_FAIL(spec.output_.init(3))) {
LOG_WARN("failed to init output_", K(ret));
return ret;
}
int pos1 = is_vec ? 2000000 : 5000000;
for (int i = 0; i < 3 ; ++i) {
ObExpr *expr = static_cast<ObExpr *> (alloc_.alloc(sizeof(ObExpr)));
if (OB_FAIL(spec.output_.push_back(expr))) {
LOG_WARN("failed to push back expr", K(ret));
return ret;
}
expr->batch_result_ = is_vec;
expr->batch_idx_mask_ = (expr->batch_result_ ? UINT64_MAX : 0);
expr->eval_batch_func_ = nullptr;
expr->eval_func_ = nullptr;
expr->frame_idx_ = 0;
expr->datum_off_ = pos1;
pos1 += sizeof(ObDatum) * op_eval_ctx_.max_batch_size_;
expr->eval_info_off_ = pos1;
pos1 += sizeof(ObEvalInfo);
expr->eval_flags_off_ = pos1;
pos1 += ObBitVector::memory_size(op_eval_ctx_.max_batch_size_);
expr->pvt_skip_off_ = pos1;
ObDatum *datums = expr->locate_batch_datums(op_eval_ctx_);
for (int64_t j = 0; j < op_eval_ctx_.max_batch_size_; j++) {
datums[j].ptr_ = op_eval_ctx_.frames_[0] + pos1;
pos1 += (3 == i ? 522 : 8);
}
}
if (OB_FAIL(spec.set_exprs_.init(3))) {
LOG_WARN("failed to get output exprs", K(ret), K(spec.set_exprs_.capacity_));
return ret;
}
pos1 = is_vec ? 6000000 : 7000000;
for (int i = 0; i < 3; ++i) {
ObExpr *expr = static_cast<ObExpr *>(alloc_.alloc(sizeof(ObExpr)));//新建expr, 设置expr对应的datum, 在对应位置放置datum
if (OB_FAIL(spec.set_exprs_.push_back(expr))) {
return ret;
}
//expr->batch_result_ = (spec.batch_size_ > 0);
//expr->batch_idx_mask_ = (expr->batch_result_ ? UINT64_MAX : 0);
expr->eval_batch_func_ = nullptr;
expr->eval_func_ = nullptr;
expr->frame_idx_ = 0;
expr->datum_off_ = pos1;
pos1 += sizeof(ObDatum) * op_eval_ctx_.max_batch_size_;
expr->eval_info_off_ = pos1;
pos1 += sizeof(ObEvalInfo);
expr->eval_flags_off_ = pos1;
pos1 += ObBitVector::memory_size(op_eval_ctx_.max_batch_size_);
expr->pvt_skip_off_ = pos1;
ObDatum *datums = expr->locate_batch_datums(op_eval_ctx_);
for (int64_t j = 0; j < op_eval_ctx_.max_batch_size_; j++) {
datums[j].ptr_ = op_eval_ctx_.frames_[0] + pos1;
pos1 += (3 == i ? 522 : 8);
}
}
if (OB_FAIL(spec.sort_collations_.init(1))) {
LOG_WARN("failed to init sort collations", K(ret));
} else if (OB_FAIL(spec.sort_cmp_funs_.init(1))) {
LOG_WARN("failed to compare function", K(ret));
} else {
LOG_WARN("init funcs");
// 初始化compare func和hash func
ObOrderDirection order_direction = default_asc_direction();
bool is_ascending = is_ascending_direction(order_direction);
ObSortFieldCollation field_collation(0,
CS_TYPE_BINARY,
is_ascending,
(is_null_first(order_direction) ^ is_ascending) ? NULL_LAST : NULL_FIRST);
if (OB_FAIL(spec.sort_collations_.push_back(field_collation))) {
LOG_WARN("failed to push back sort collation", K(ret));
}
ObSortCmpFunc cmp_func;
ObObjType tmp_type = ObIntType;
cmp_func.cmp_func_ = ObDatumFuncs::get_nullsafe_cmp_func(tmp_type,
tmp_type,
field_collation.null_pos_,
field_collation.cs_type_,
SCALE_UNKNOWN_YET,
lib::is_oracle_mode(),
false);
if (OB_FAIL(spec.sort_cmp_funs_.push_back(cmp_func))) {
LOG_WARN("failed to push back sort function", K(ret));
}
}
return ret;
}
int generate_merge_distinct_spec(ObMergeDistinctSpec &spec, bool is_vec)
{
int ret = OB_SUCCESS;
//spec.set_exprs_.set_allocator(&alloc_);
//spec.sort_cmp_funs_.set_allocator(&alloc_);
//spec.sort_collations_.set_allocator(&alloc_);
spec.distinct_exprs_.destroy();
spec.cost_ = 1;
spec.rows_ = 5000;
spec.width_ = 20;
if (OB_FAIL(spec.output_.init(3))) {
LOG_WARN("failed to init output_", K(ret));
return ret;
}
int pos1 = is_vec ? 2000000 : 5000000;
for (int i = 0; i < 3 ; ++i) {
ObExpr *expr = static_cast<ObExpr *> (alloc_.alloc(sizeof(ObExpr)));
if (OB_FAIL(spec.output_.push_back(expr))) {
LOG_WARN("failed to push back expr", K(ret));
return ret;
}
expr->batch_result_ = (spec.batch_size_ > 0);
expr->batch_idx_mask_ = (expr->batch_result_ ? UINT64_MAX : 0);
expr->eval_batch_func_ = nullptr;
expr->eval_func_ = nullptr;
expr->frame_idx_ = 0;
expr->datum_off_ = pos1;
pos1 += sizeof(ObDatum) * op_eval_ctx_.max_batch_size_;
expr->eval_info_off_ = pos1;
pos1 += sizeof(ObEvalInfo);
expr->eval_flags_off_ = pos1;
pos1 += ObBitVector::memory_size(op_eval_ctx_.max_batch_size_);
expr->pvt_skip_off_ = pos1;
ObDatum *datums = expr->locate_batch_datums(op_eval_ctx_);
for (int64_t j = 0; j < op_eval_ctx_.max_batch_size_; j++) {
datums[j].ptr_ = op_eval_ctx_.frames_[0] + pos1;
pos1 += (3 == i ? 522 : 8);
}
}
if (OB_FAIL(spec.distinct_exprs_.init(3))) {
LOG_WARN("failed to get output exprs", K(ret), K(spec.distinct_exprs_.capacity_));
return ret;
}
pos1 = is_vec ? 6000000 : 7000000;
for (int i = 0; i < 3; ++i) {
ObExpr *expr = static_cast<ObExpr *>(alloc_.alloc(sizeof(ObExpr)));//新建expr, 设置expr对应的datum, 在对应位置放置datum
if (OB_FAIL(spec.distinct_exprs_.push_back(expr))) {
return ret;
}
//expr->batch_result_ = (spec.batch_size_ > 0);
//expr->batch_idx_mask_ = (expr->batch_result_ ? UINT64_MAX : 0);
expr->eval_batch_func_ = nullptr;
expr->eval_func_ = nullptr;
expr->frame_idx_ = 0;
expr->datum_off_ = pos1;
pos1 += sizeof(ObDatum) * op_eval_ctx_.max_batch_size_;
expr->eval_info_off_ = pos1;
pos1 += sizeof(ObEvalInfo);
expr->eval_flags_off_ = pos1;
pos1 += ObBitVector::memory_size(op_eval_ctx_.max_batch_size_);
expr->pvt_skip_off_ = pos1;
ObDatum *datums = expr->locate_batch_datums(op_eval_ctx_);
for (int64_t j = 0; j < op_eval_ctx_.max_batch_size_; j++) {
datums[j].ptr_ = op_eval_ctx_.frames_[0] + pos1;
pos1 += (3 == i ? 522 : 8);
}
}
if (OB_FAIL(spec.cmp_funcs_.init(1))) {
LOG_WARN("failed to compare function", K(ret));
} else {
LOG_WARN("init funcs");
// 初始化compare func和hash func
ObOrderDirection order_direction = default_asc_direction();
bool is_ascending = is_ascending_direction(order_direction);
ObSortFieldCollation field_collation(0,
CS_TYPE_BINARY,
is_ascending,
(is_null_first(order_direction) ^ is_ascending) ? NULL_LAST : NULL_FIRST);
ObSortCmpFunc cmp_func;
ObObjType tmp_type = ObIntType;
cmp_func.cmp_func_ = ObDatumFuncs::get_nullsafe_cmp_func(tmp_type,
tmp_type,
field_collation.null_pos_,
field_collation.cs_type_,
SCALE_UNKNOWN_YET,
lib::is_oracle_mode(),
false);
if (OB_FAIL(spec.cmp_funcs_.push_back(cmp_func))) {
LOG_WARN("failed to push back sort function", K(ret));
}
}
return ret;
}
protected:
ObArenaAllocator alloc_;
ObMergeIntersectSpec spec1_;
ObMergeIntersectSpec spec2_;
ObMergeExceptSpec spec3_;
ObMergeExceptSpec spec4_;
SetDataGeneratorSpec spec5_;
SetDataGeneratorSpec spec6_;
ObMergeUnionSpec spec7_;
ObMergeUnionSpec spec8_;
SetDataGeneratorSpec spec9_;
SetDataGeneratorSpec spec10_;
ObMergeDistinctSpec spec11_;
ObMergeDistinctSpec spec12_;
ObMergeIntersectOp merge_intersect_vec_;
ObMergeIntersectOp merge_intersect_;
ObMergeExceptOp merge_except_vec_;
ObMergeExceptOp merge_except_;
ObMergeUnionOp merge_union_vec_;
ObMergeUnionOp merge_union_;
ObMergeDistinctOp merge_distinct_vec_;
ObMergeDistinctOp merge_distinct_;
ObOperator *merge_set_op_vec_;
ObOperator *merge_set_op_;
SetPlan merge_plan_vec_;
SetPlan merge_plan_;
};
int ObMergeSetVecTest::SetPlan::setup_plan(ObOperator *set_op)
{
int ret = OB_SUCCESS;
bool is_vec = (left_.get_spec().batch_size_ > 0);
bool is_distinct = (nullptr != dynamic_cast<ObMergeDistinctOp *> (set_op));
left_.init_expr(is_vec ? 0 : 8000000);
right_.init_expr(is_vec ? 0 : 8000000);
SetDataGeneratorSpec &left_spec = const_cast<SetDataGeneratorSpec &> (left_.get_spec());
SetDataGeneratorSpec &right_spec = const_cast<SetDataGeneratorSpec &> (right_.get_spec());
set_op_ = set_op;
ObOpSpec &set_op_spec = const_cast<ObOpSpec &> (set_op_->get_spec());
left_spec.id_ = 0;
right_spec.id_ = 1;
set_op_spec.id_ = 2;
//LOG_WARN("value:", K(left_spec), K(right_spec));
//set_op_->set_column_count(SetDataGenerator::CELL_CNT * 2); 没有的参数
left_spec.plan_=&plan_;
right_spec.plan_=&plan_;
set_op_spec.plan_=&plan_;
set_op_->ctx_.set_my_session(&session_);
set_op_->ctx_.init_phy_op(is_distinct ? 2 : 3);
set_op_->ctx_.create_physical_plan_ctx();
ObOperator **children_ptr = static_cast<ObOperator **>(exec_ctx_.get_allocator().alloc(sizeof(ObOperator *) * (is_distinct ? 1 : 2)));
ObOpSpec **spec_children_ptr = static_cast<ObOpSpec **>(exec_ctx_.get_allocator().alloc(sizeof(ObOpSpec *) * (is_distinct ? 1 : 2)));
if (OB_ISNULL(children_ptr)) {
ret = OB_ALLOCATE_MEMORY_FAILED;
LOG_WARN("alloc for children_ptr failed ", K(ret));
} else if (OB_ISNULL(spec_children_ptr)) {
ret = OB_ALLOCATE_MEMORY_FAILED;
LOG_WARN("alloc for spec_children_ptr falied", K(ret));
} else {
children_ptr[0] = static_cast<ObOperator *>(&left_);
spec_children_ptr[0] = static_cast<ObOpSpec *>(&left_spec);
if (!is_distinct) {
children_ptr[1] = static_cast<ObOperator *>(&right_);
spec_children_ptr[1] = static_cast<ObOpSpec *>(&right_spec);
}
}
if (OB_FAIL(set_op_->set_children_pointer(children_ptr, (is_distinct ? 1 : 2)))) {
LOG_WARN("failed to set children for set op", K(ret));
} else if (OB_FAIL(set_op_spec.set_children_pointer(spec_children_ptr, (is_distinct ? 1 : 2)))) {
LOG_WARN("failed to set spec children for set op", K(ret));
}
//set_op_->set_distinct(true); 没有的参数
// setup context
ObString tenant_name("test");
if (OB_FAIL(ret)) {
} else if (OB_FAIL(session_.test_init(0, 0, 0, NULL))) {
} else if (OB_FAIL(ObPreProcessSysVars::init_sys_var())) {
} else if (OB_FAIL(session_.load_default_sys_variable(false, true))) {
} else if (OB_FAIL(session_.init_tenant(tenant_name, OB_SYS_TENANT_ID))) {
} else if (FALSE_IT(exec_ctx_.set_my_session(&session_))) {
} else if (OB_FAIL(exec_ctx_.init_phy_op((is_distinct ? 2 : 3)))) {
} else if (OB_FAIL(exec_ctx_.create_physical_plan_ctx())) {
}
LOG_WARN("value:", K(left_spec), K(right_spec), K(set_op_spec));
return ret;
}
void ObMergeSetVecTest::setup_plan(SetPlan &plan, bool vec_algo, ObMergeSetVecTest::TestAlgo algo)
{
int ret = OB_SUCCESS;
switch (algo)
{
case UNION:
if (vec_algo) {
ASSERT_EQ(OB_SUCCESS, plan.setup_plan(&merge_union_vec_));
merge_set_op_vec_ = &merge_union_vec_;
ObMergeSetSpec &merge_spec = static_cast<ObMergeSetSpec &>(const_cast<ObOpSpec &> (merge_set_op_vec_->get_spec()));
if (OB_FAIL(generate_merge_set_spec(merge_spec, true))) {
LOG_WARN("failed to generate merge_set_spec", K(ret));
} else {
LOG_WARN("success to generate merge_set_spec", K(ret));
}
} else {
ASSERT_EQ(OB_SUCCESS, plan.setup_plan(&merge_union_));
merge_set_op_ = &merge_union_;
ObMergeSetSpec &merge_spec = static_cast<ObMergeSetSpec &>(const_cast<ObOpSpec &> (merge_set_op_->get_spec()));
if (OB_FAIL(generate_merge_set_spec(merge_spec, false))) {
LOG_WARN("failed to generate merge_set_spec", K(ret));
} else {
LOG_WARN("success to generate merge_set_spec", K(ret));
}
}
break;
case INTERSECT:
if (vec_algo) {
ASSERT_EQ(OB_SUCCESS, plan.setup_plan(&merge_intersect_vec_));
merge_set_op_vec_ = &merge_intersect_vec_;
ObMergeSetSpec &merge_spec = static_cast<ObMergeSetSpec &>(const_cast<ObOpSpec &> (merge_set_op_vec_->get_spec()));
if (OB_FAIL(generate_merge_set_spec(merge_spec, true))) {
LOG_WARN("failed to generate merge_set_spec", K(ret));
} else {
LOG_WARN("success to generate merge_set_spec", K(ret));
}
} else {
ASSERT_EQ(OB_SUCCESS, plan.setup_plan(&merge_intersect_));
merge_set_op_ = &merge_intersect_;
ObMergeSetSpec &merge_spec = static_cast<ObMergeSetSpec &>(const_cast<ObOpSpec &> (merge_set_op_->get_spec()));
if (OB_FAIL(generate_merge_set_spec(merge_spec, false))) {
LOG_WARN("failed to generate merge_set_spec", K(ret));
} else {
LOG_WARN("success to generate merge_set_spec", K(ret));
}
}
break;
case EXCEPT:
if (vec_algo) {
ASSERT_EQ(OB_SUCCESS, plan.setup_plan(&merge_except_vec_));
merge_set_op_vec_ = &merge_except_vec_;
ObMergeSetSpec &merge_spec = static_cast<ObMergeSetSpec &>(const_cast<ObOpSpec &> (merge_set_op_vec_->get_spec()));
generate_merge_set_spec(merge_spec, true);
} else {
ASSERT_EQ(OB_SUCCESS, plan.setup_plan(&merge_except_));
merge_set_op_ = &merge_except_;
ObMergeSetSpec &merge_spec = static_cast<ObMergeSetSpec &>(const_cast<ObOpSpec &> (merge_set_op_->get_spec()));
generate_merge_set_spec(merge_spec, false);
}
break;
case DISTINCT:
if (vec_algo) {
ASSERT_EQ(OB_SUCCESS, plan.setup_plan(&merge_distinct_vec_));
merge_set_op_vec_ = &merge_distinct_vec_;
ObMergeDistinctSpec &merge_spec = static_cast<ObMergeDistinctSpec &>(const_cast<ObOpSpec &> (merge_set_op_vec_->get_spec()));
generate_merge_distinct_spec(merge_spec, true);
} else {
ASSERT_EQ(OB_SUCCESS, plan.setup_plan(&merge_distinct_));
merge_set_op_ = &merge_distinct_;
ObMergeDistinctSpec &merge_spec = static_cast<ObMergeDistinctSpec &>(const_cast<ObOpSpec &> (merge_set_op_->get_spec()));
generate_merge_distinct_spec(merge_spec, false);
}
break;
default:
break;
}
}
void ObMergeSetVecTest::setup_test(TestAlgo algo, int32_t string_size,
int64_t left_row_count, bool left_reverse, IdxCntFunc left_func,
int64_t right_row_count, bool right_reverse, IdxCntFunc right_func)
{
SetPlan *plans[] = { &merge_plan_vec_, &merge_plan_ };
for (int i = 0; i < 2; i++) {
auto &plan = *plans[i];
setup_plan(plan, i == 0 ? true : false, algo);
plan.left_.row_cnt_ = left_row_count;
plan.right_.row_cnt_ = right_row_count;
plan.left_.string_size_ = string_size;
plan.right_.string_size_ = string_size;
UNUSED(left_reverse);
UNUSED(left_func);
UNUSED(right_reverse);
UNUSED(right_func);
/*if (&plan != &merge_plan_) {
plan.left_.reverse_ = left_reverse;
plan.right_.reverse_ = right_reverse;
}*/
//plan.left_.idx_cnt_func_ = left_func;
//plan.right_.idx_cnt_func_ = right_func;
ASSERT_EQ(OB_SUCCESS, plan.left_.test_init());
ASSERT_EQ(OB_SUCCESS, plan.right_.test_init());
}
}
void ObMergeSetVecTest::run_test(int64_t print_row_cnt)
{
UNUSED(print_row_cnt);
ObArenaAllocator alloc;
typedef ObArray<int64_t *> ResArray;
int64_t res_cell_cnt = 1;
const ObBatchRows * child_brs = nullptr;
auto fun_batch = [&](SetPlan &plan, ResArray &res)->void
{
spec5_.batch_size_ = BATCH_SIZE;
spec6_.batch_size_ = BATCH_SIZE;
ASSERT_EQ(OB_SUCCESS, plan.set_op_->open());
int ret = OB_SUCCESS;
while (OB_SUCC(ret)) {
ret = plan.set_op_->get_next_batch(BATCH_SIZE, child_brs);
ASSERT_EQ(OB_SUCCESS, ret);
if (child_brs->end_ && 0 == child_brs->size_) {
ret = OB_ITER_END;
} else {
auto &c = plan.set_op_->get_spec().output_[0];
ObDatum *result = c->locate_batch_datums(op_eval_ctx_);
for (int64_t j = 0; j < child_brs->size_; ++j) {
if (child_brs->skip_->at(j)) {
continue;
}
auto r = static_cast<int64_t *>(alloc.alloc(sizeof(int64_t) * res_cell_cnt));
ASSERT_TRUE(NULL != r);
for (int64_t i = 0; i < res_cell_cnt; i++) {
ObDatum &dtm = result[j];
r[i] = dtm.get_int();
}
ASSERT_EQ(OB_SUCCESS, res.push_back(r));
}
}
}
};
auto fun = [&](SetPlan &plan, ResArray &res)->void
{
spec5_.batch_size_ = 0;
spec6_.batch_size_ = 0;
ASSERT_EQ(OB_SUCCESS, plan.set_op_->open());
int ret = OB_SUCCESS;
const ObNewRow *row = NULL;
int64_t cnt = 0;
while (OB_SUCC(ret)) {
if (OB_FAIL(plan.set_op_->get_next_row())) {
ASSERT_EQ(OB_ITER_END, ret);
} else {
auto r = static_cast<int64_t *>(alloc.alloc(sizeof(int64_t) * res_cell_cnt));
ASSERT_TRUE(NULL != r);
for (int64_t i = 0; i < res_cell_cnt; i++) {
auto &c = plan.set_op_->get_spec().output_[0];
ObDatum &dtm = c->locate_expr_datum(op_eval_ctx_);
r[i] = dtm.get_int();
}
ASSERT_EQ(OB_SUCCESS, res.push_back(r));
}
cnt++;
}
};
auto pfunc = [&](int64_t *r)
{
ObSqlString s;
for (int64_t i = 0; i < res_cell_cnt; i++) {
s.append_fmt("%ld, ", r[i]);
}
LOG_INFO("RES:", K(s.ptr()));
};
ResArray merge_res_vec;
fun_batch(merge_plan_vec_, merge_res_vec);
ASSERT_FALSE(HasFatalFailure());
ResArray merge_res;
fun(merge_plan_, merge_res);
LOG_WARN("bp4");
ASSERT_FALSE(HasFatalFailure());
ASSERT_EQ(merge_res_vec.count(), merge_res.count());
auto sort_cmp = [&](int64_t *l, int64_t *r)
{
for (int64_t i = 0; i < res_cell_cnt; i++) {
if (l[i] != r[i]) {
return l[i] < r[i];
}
}
return false;
};
LOG_WARN("bp5", K(merge_res_vec.count()));
std::sort(&merge_res_vec.at(0), &merge_res_vec.at(0) + merge_res_vec.count(), sort_cmp);
LOG_WARN("bp6", K(merge_res.count()));
std::sort(&merge_res.at(0), &merge_res.at(0) + merge_res.count(), sort_cmp);
for (int64_t i = 0; i < merge_res_vec.count(); i++) {
ASSERT_EQ(*merge_res.at(i), *merge_res_vec.at(i));
}
merge_set_op_vec_->close();
merge_set_op_->close();
merge_plan_vec_.~SetPlan();
merge_plan_.~SetPlan();
ASSERT_EQ(OB_SUCCESS, blocksstable::ObTmpFileManager::get_instance().files_.map_.size());
}
int ObMergeSetVecTest::init_tenant_mgr()
{
int ret = OB_SUCCESS;
ObTenantManager &tm = ObTenantManager::get_instance();
ObAddr self;
oceanbase::rpc::frame::ObReqTransport req_transport(NULL, NULL);
oceanbase::obrpc::ObSrvRpcProxy rpc_proxy;
oceanbase::obrpc::ObCommonRpcProxy rs_rpc_proxy;
oceanbase::share::ObRsMgr rs_mgr;
uint64_t cluster_version = CLUSTER_VERSION_3000;
common::ObClusterVersion::get_instance().update_cluster_version(cluster_version);
EXPECT_EQ(cluster_version, common::ObClusterVersion::get_instance().get_cluster_version());
int64_t tenant_id = OB_SYS_TENANT_ID;
self.set_ip_addr("127.0.0.1", 8086);
ret = ObTenantConfigMgr::get_instance().add_tenant_config(tenant_id);
EXPECT_EQ(OB_SUCCESS, ret);
ret = tm.init(self, rpc_proxy, rs_rpc_proxy, rs_mgr, &req_transport, &ObServerConfig::get_instance());
EXPECT_EQ(OB_SUCCESS, ret);
ret = tm.add_tenant(tenant_id);
EXPECT_EQ(OB_SUCCESS, ret);
ret = tm.set_tenant_mem_limit(tenant_id,
4L * 1024L * 1024L * 1024L, 8L * 1024L * 1024L * 1024L);
EXPECT_EQ(OB_SUCCESS, ret);
ret = tm.add_tenant(OB_SERVER_TENANT_ID);
EXPECT_EQ(OB_SUCCESS, ret);
const int64_t ulmt = 256LL << 30;
const int64_t llmt = 256LL << 30;
ret = tm.set_tenant_mem_limit(OB_SYS_TENANT_ID, ulmt, llmt);
EXPECT_EQ(OB_SUCCESS, ret);
ret = tm.set_tenant_mem_limit(OB_SERVER_TENANT_ID, ulmt, llmt);
EXPECT_EQ(OB_SUCCESS, ret);
auto ctx_allocator =
lib::ObMallocAllocator::get_instance()->get_tenant_ctx_allocator(
OB_SERVER_TENANT_ID, common::ObCtxIds::DEFAULT_CTX_ID);
EXPECT_EQ(OB_SUCCESS, ret);
ret = ctx_allocator->set_limit(8L * 1024L * 1024L * 1024L);
EXPECT_EQ(OB_SUCCESS, ret);
oceanbase::lib::set_memory_limit(128LL << 32);
return ret;
}
/*TEST_F(ObMergeSetVecTest, test_intersect_dump)
{
setup_test(ObMergeSetVecTest::TestAlgo::INTERSECT, 512,
200000*3, false, [](int64_t id, int64_t) { return id % 3 == 0 ? 1 : 0; },
200000*3, false, [](int64_t id, int64_t) { return id % 5 == 0 ? 1 : 0; });
ASSERT_FALSE(HasFatalFailure());
run_test();
ASSERT_FALSE(HasFatalFailure());
}
TEST_F(ObMergeSetVecTest, test_except_dump)
{
setup_test(ObMergeSetVecTest::TestAlgo::EXCEPT, 512,
200000 * 3, false, [](int64_t id, int64_t) { return id % 3 == 0 ? 1 : 0; },
200000 * 3, false, [](int64_t id, int64_t) { return id % 5 == 0 ? 1 : 0; });
ASSERT_FALSE(HasFatalFailure());
run_test();
ASSERT_FALSE(HasFatalFailure());
}*/
TEST_F(ObMergeSetVecTest, test_union_dump)
{
setup_test(ObMergeSetVecTest::TestAlgo::UNION, 512,
200000 * 3 , false, [](int64_t id, int64_t) { return id % 3 == 0 ? 1 : 0; },
200000 * 3 , false, [](int64_t id, int64_t) { return id % 5 == 0 ? 1 : 0; });
ASSERT_FALSE(HasFatalFailure());
run_test();
ASSERT_FALSE(HasFatalFailure());
}
/*TEST_F(ObMergeSetVecTest, test_distinct_dump)
{
setup_test(ObMergeSetVecTest::TestAlgo::DISTINCT, 512,
200000 * 3 , false, [](int64_t id, int64_t) { return id % 3 == 0 ? 1 : 0; },
200000 * 3 , false, [](int64_t id, int64_t) { return id % 5 == 0 ? 1 : 0; });
ASSERT_FALSE(HasFatalFailure());
run_test();
ASSERT_FALSE(HasFatalFailure());
}*/
} // end sql
} // end oceanbase
int main(int argc, char **argv)
{
exec_ctx_.eval_ctx_ = &op_eval_ctx_;
op_eval_ctx_.max_batch_size_ = 256;
op_eval_ctx_.frames_ = static_cast<char **>(exec_ctx_.get_allocator().alloc(sizeof(void *) * 2));
op_eval_ctx_.frames_[0] = (char *)exec_ctx_.get_allocator().alloc(10000000);
oceanbase::sql::init_sql_factories();
OB_LOGGER.set_log_level("INFO");
::testing::InitGoogleTest(&argc,argv);
int ret = RUN_ALL_TESTS();
OB_LOGGER.disable();
return ret;
}