Files
oceanbase/unittest/sql/engine/set/set_data_op_generator.h
wangzelin.wzl 93a1074b0c patch 4.0
2022-10-24 17:57:12 +08:00

281 lines
8.3 KiB
C++

/**
* Copyright (c) 2021 OceanBase
* OceanBase CE is licensed under Mulan PubL v2.
* You can use this software according to the terms and conditions of the Mulan PubL v2.
* You may obtain a copy of Mulan PubL v2 at:
* http://license.coscl.org.cn/MulanPubL-2.0
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
* See the Mulan PubL v2 for more details.
*/
#ifndef OCEANBASE_SET_DATA_GENERATOR_OP_H_
#define OCEANBASE_SET_DATA_GENERATOR_OP_H_
#include <functional>
#include "sql/engine/ob_operator.h"
#include "sql/engine/set/ob_hash_set_op.h"
#include "sql/engine/ob_exec_context.h"
#include "lib/container/ob_array.h"
#include "common/row/ob_row_desc.h"
#include "common/rowkey/ob_rowkey.h"
#include "lib/utility/ob_hang_fatal_error.h"
#include "sql/engine/px/ob_px_util.h"
#include "sql/engine/basic/ob_hash_partitioning_infrastructure_op.h"
const int LEFT_HASH_SEED = 1000000007;
const int RIGHT_HASH_SEED = 100007;
namespace oceanbase
{
namespace sql
{
class SetDataGeneratorSpec;
class SetDataGeneratorOp;
static const SetDataGeneratorSpec &get_my_spec(const SetDataGeneratorOp &op);
class SetDataGeneratorSpec : public ObOpSpec
{
OB_UNIS_VERSION_V(1);
public:
SetDataGeneratorSpec(common::ObIAllocator &alloc, const ObPhyOperatorType type) : ObOpSpec(alloc, type)
{
}
};
OB_SERIALIZE_MEMBER((SetDataGeneratorSpec, ObOpSpec));
class SetDataGeneratorOp : public ObOperator
{
public:
SetDataGeneratorOp(ObExecContext &exec_ctx, const ObOpSpec &spec, ObOpInput *input, ObString op_id)
: ObOperator(exec_ctx, spec, input), op_id_(op_id)
{
for (int i = 0; i != 1000; ++i) {
str_buf_[i] = 's';
}
}
//void set_column_num(const int num) { columns_num_ = num; } 暂定3列
int test_init()
{
int ret = OB_SUCCESS;
//set_column_count(columns_num_);
row_id_ = 0;
return ret;
}
void destroy()
{
ObOperator::destroy();
}
/*int open()
{
int ret = OB_SUCCESS;
opened_ = true;
return ret;
}*/
int convert_row(
const common::ObIArray<ObExpr *> &src_exprs, const common::ObIArray<ObExpr *> &dst_exprs)
{
int ret = OB_SUCCESS;
if (dst_exprs.count() != src_exprs.count()) {
ret = OB_ERR_UNEXPECTED;
OB_LOG(WARN, "unexpected status: exprs is not match", K(ret), K(src_exprs.count()),
K(dst_exprs.count()));
} else {
// do nothing
}
return ret;
}
void init_expr(int64_t init_pos)
{
int64_t pos = init_pos;
if (op_id_ == ObString("RIGHT_OP")) {
pos += 1000000;
}
if (cells_.count() == 0) {
for (int64_t i = 0; i < columns_num_; ++i) {
ObExpr *expr = static_cast<ObExpr*>(alloc_.alloc(sizeof(ObExpr)));
ASSERT_EQ(OB_SUCCESS, cells_.push_back(expr));
expr->frame_idx_ = 0;
expr->datum_off_ = pos;
pos += sizeof(ObDatum) * eval_ctx_.max_batch_size_;
expr->eval_info_off_ = pos;
pos += sizeof(ObEvalInfo);
expr->eval_flags_off_ = pos;
pos += ObBitVector::memory_size(eval_ctx_.max_batch_size_);
expr->pvt_skip_off_ = pos;
expr->batch_result_ = (spec_.batch_size_ > 0);
expr->batch_idx_mask_ = (expr->batch_result_ ? UINT64_MAX : 0);
expr->datum_meta_.type_ = ObIntType;
ObDatum *datums = expr->locate_batch_datums(eval_ctx_);
for (int64_t j = 0; j < eval_ctx_.max_batch_size_; j++) {
datums[j].ptr_ = eval_ctx_.frames_[0] + pos;
pos += (3 == i ? 522 : 8);
}
}
}
SetDataGeneratorSpec &op_spec = const_cast<SetDataGeneratorSpec &> (get_spec());
if (op_spec.output_.count() == 0) {
ASSERT_EQ(OB_SUCCESS, op_spec.output_.init(3));
for (int64_t i = 0; i < columns_num_; ++i) {
ObExpr *expr = cells_[i];
ASSERT_EQ(OB_SUCCESS, op_spec.output_.push_back(expr));
}
}
}
void gen_row(int64_t row_id)
{
ObDatum *expr_datum_0 = &cells_.at(0)->locate_expr_datum(eval_ctx_);
int id = row_id / 2;
int key = id * 100 + static_cast<int>(static_cast<int64_t>(hash(id)) % 91);
expr_datum_0->set_int(key);
cells_.at(0)->get_eval_info(eval_ctx_).evaluated_ = true;
/*int64_t max_size = 512;
if (enable_big_row_ && row_id > 0 && random() % 100000 < 5) {
max_size = 1 << 20;
}*/
ObDatum *expr_datum_1 = &cells_.at(1)->locate_expr_datum(eval_ctx_);
expr_datum_1->set_null();
cells_.at(1)->get_eval_info(eval_ctx_).evaluated_ = true;
int64_t size = 300;
ObDatum *expr_datum_2 = &cells_.at(2)->locate_expr_datum(eval_ctx_);
expr_datum_2->set_string(str_buf_, (int)size);
cells_.at(2)->get_eval_info(eval_ctx_).evaluated_ = true;
}
void gen_batch(int64_t &row_id, const int64_t batch_size)
{
ObEvalCtx::BatchInfoScopeGuard guard(eval_ctx_);
guard.set_batch_idx(0);
ObDatumVector datum0 = cells_.at(0)->locate_expr_datumvector(eval_ctx_);
ObDatumVector datum1 = cells_.at(1)->locate_expr_datumvector(eval_ctx_);
ObDatumVector datum2 = cells_.at(2)->locate_expr_datumvector(eval_ctx_);
for (int64_t i = 0; i < batch_size; ++i) {
int id = (row_id + i) / 2;
int key = (id) * 100 + static_cast<int>(static_cast<int64_t>(hash((id))) % 91);
datum0.at(i).set_int(key);
cells_.at(0)->get_eval_info(eval_ctx_).evaluated_ = true;
datum1.at(i).set_null();
cells_.at(1)->get_eval_info(eval_ctx_).evaluated_ = true;
int64_t size = 300;
datum2.at(i).set_string(str_buf_, (int)size);
cells_.at(2)->get_eval_info(eval_ctx_).evaluated_ = true;
}
if (row_id + batch_size <= row_cnt_) {
brs_.size_ = batch_size;
row_id += batch_size;
} else {
brs_.size_ = row_cnt_ - row_id;
row_id += brs_.size_;
}
}
uint64_t hash(int64_t value)
{
uint64_t seed = 0;
if (op_id_ == ObString("RIGHT_OP")) {
seed =static_cast<uint64_t>(RIGHT_HASH_SEED);
} else {
seed = static_cast<uint64_t>(LEFT_HASH_SEED);
}
uint64_t res = (value * seed);
return res;
}
/*int inner_get_next_row()
{
int ret = OB_SUCCESS;
gen_row(row_cnt_);
if (row_cnt_ <= 0) {
return iter_end_ret_;
} else if (OB_FAIL(convert_row(cells_, MY_SPEC.output_))) { //将cur_expr写入到output中
OB_LOG(WARN, "copy current row failed", K(ret));
} else {
row_cnt_--;
}
char *frame = eval_ctx_.frames_[0];
ObDatum *tmp_datum = (ObDatum *)(frame + 72);
return ret;
}*/
int inner_get_next_row()
{
static int add =0;
int ret = OB_SUCCESS;
gen_row(row_id_);
if (row_id_ < 0 || row_id_ >= row_cnt_) {
return iter_end_ret_;
} else if (OB_FAIL(convert_row(cells_, MY_SPEC.output_))) { //将cur_expr写入到output中
OB_LOG(WARN, "copy current row failed", K(ret));
} else {
++add;
++row_id_;
}
char *frame = eval_ctx_.frames_[0];
ObDatum *tmp_datum = (ObDatum *)(frame + 72);
return ret;
}
int inner_get_next_batch(const int64_t max_row_cnt)
{
int ret = OB_SUCCESS;
gen_batch(row_id_, max_row_cnt);
if (row_id_ < 0 || row_id_ >= row_cnt_) {
brs_.end_ = true;
}
return ret;
}
const SetDataGeneratorSpec &get_spec() const
{
return static_cast<const SetDataGeneratorSpec &>(spec_);
}
int64_t row_cnt_ = 1;
int string_size_ = 64;
typedef std::function<int64_t(const int64_t, const int64_t)> IdxCntFunc;
IdxCntFunc idx_cnt_func_ = [](const int64_t, const int64_t) { return 1; };
typedef std::function<int64_t(const int64_t)> IdValFunc;
IdValFunc row_id_val_ = [](const int64_t v) { return v; };
IdValFunc idx_val_ = [](const int64_t v) { return v; };
int iter_end_ret_ = OB_ITER_END;
const static int columns_num_=3;
private:
ObString op_id_;
int64_t row_id_ = 0;
ObSEArray<ObExpr *, columns_num_> cells_;
ObSEArray<ObExpr *, columns_num_> ver_cells_;
const static int64_t BUF_SIZE = 2 << 20;
char str_buf_[BUF_SIZE];
bool enable_big_row_ = false;
ObArenaAllocator alloc_;
ObArenaAllocator eval_res_;
ObArenaAllocator eval_tmp_;
ObExecContext exec_ctx_;
//ObEvalCtx eval_ctx_;
};
const static SetDataGeneratorSpec &get_my_spec(const SetDataGeneratorOp &op)
{
return op.get_spec();
}
} // end sql
} // end oceanbase
#endif // OCEANBASE_SET_DATA_GENERATOR_OP_H_