
Co-authored-by: wxhwang <wxhwang@126.com> Co-authored-by: godyangfight <godyangfight@gmail.com> Co-authored-by: Tyshawn <tuyunshan@gmail.com>
373 lines
13 KiB
C++
373 lines
13 KiB
C++
/**
|
|
* Copyright (c) 2021 OceanBase
|
|
* OceanBase CE is licensed under Mulan PubL v2.
|
|
* You can use this software according to the terms and conditions of the Mulan PubL v2.
|
|
* You may obtain a copy of Mulan PubL v2 at:
|
|
* http://license.coscl.org.cn/MulanPubL-2.0
|
|
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
|
|
* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
|
|
* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
|
|
* See the Mulan PubL v2 for more details.
|
|
*/
|
|
|
|
#define USING_LOG_PREFIX STORAGE
|
|
|
|
#include <gtest/gtest.h>
|
|
#define protected public
|
|
#define private public
|
|
#include "storage/blocksstable/encoding/ob_micro_block_encoder.h"
|
|
#include "storage/blocksstable/encoding/ob_micro_block_decoder.h"
|
|
#include "storage/ob_i_store.h"
|
|
#include "lib/string/ob_sql_string.h"
|
|
#include "../ob_row_generate.h"
|
|
#include "common/rowkey/ob_rowkey.h"
|
|
#include "share/ob_cluster_version.h"
|
|
|
|
namespace oceanbase
|
|
{
|
|
namespace blocksstable
|
|
{
|
|
|
|
using namespace common;
|
|
using namespace storage;
|
|
using namespace share::schema;
|
|
|
|
enum EncodeTestCase
|
|
{
|
|
FORCE_RAW_ON_SPAN_COLUMN_WITH_NULL,
|
|
MAX_TEST_CASE,
|
|
};
|
|
|
|
class TestIColumnEncoder : public ::testing::Test
|
|
{
|
|
public:
|
|
TestIColumnEncoder(const bool is_multi_version_row = false)
|
|
: is_multi_version_row_(is_multi_version_row), tenant_ctx_(OB_SERVER_TENANT_ID)
|
|
{
|
|
share::ObTenantEnv::set_tenant(&tenant_ctx_);
|
|
}
|
|
virtual ~TestIColumnEncoder() {}
|
|
virtual void SetUp();
|
|
virtual void TearDown() {}
|
|
|
|
protected:
|
|
int64_t rowkey_cnt_;
|
|
int64_t column_cnt_;
|
|
ObObjType *col_types_;
|
|
ObRowGenerate row_generate_;
|
|
ObMicroBlockEncodingCtx ctx_;
|
|
ObRowkeyReadInfo read_info_;
|
|
ObArenaAllocator allocator_;
|
|
common::ObArray<share::schema::ObColDesc> col_descs_;
|
|
bool is_multi_version_row_;
|
|
share::ObTenantBase tenant_ctx_;
|
|
};
|
|
|
|
void TestIColumnEncoder::SetUp()
|
|
{
|
|
oceanbase::ObClusterVersion::get_instance().update_data_version(DATA_CURRENT_VERSION);
|
|
const int64_t tid = 200001;
|
|
ObTableSchema table;
|
|
ObColumnSchemaV2 col;
|
|
table.reset();
|
|
table.set_tenant_id(1);
|
|
table.set_tablegroup_id(1);
|
|
table.set_database_id(1);
|
|
table.set_table_id(tid);
|
|
table.set_table_name("test_micro_decoder_schema");
|
|
table.set_rowkey_column_num(rowkey_cnt_);
|
|
table.set_max_column_id(column_cnt_ * 2);
|
|
|
|
ObSqlString str;
|
|
for (int64_t i = 0; i < column_cnt_; ++i) {
|
|
col.reset();
|
|
col.set_table_id(tid);
|
|
col.set_column_id(i + OB_APP_MIN_COLUMN_ID);
|
|
str.assign_fmt("test%ld", i);
|
|
col.set_column_name(str.ptr());
|
|
ObObjType type = col_types_[i];
|
|
col.set_data_type(type);
|
|
col.set_collation_type(CS_TYPE_UTF8MB4_GENERAL_CI);
|
|
if (type == ObIntType) {
|
|
col.set_rowkey_position(1);
|
|
} else{
|
|
col.set_rowkey_position(0);
|
|
}
|
|
ASSERT_EQ(OB_SUCCESS, table.add_column(col));
|
|
}
|
|
|
|
ASSERT_EQ(OB_SUCCESS, row_generate_.init(table, is_multi_version_row_));
|
|
if (is_multi_version_row_) {
|
|
ASSERT_EQ(OB_SUCCESS, row_generate_.get_schema().get_multi_version_column_descs(col_descs_));
|
|
} else {
|
|
ASSERT_EQ(OB_SUCCESS, row_generate_.get_schema().get_column_ids(col_descs_));
|
|
}
|
|
ASSERT_EQ(OB_SUCCESS, read_info_.init(allocator_,
|
|
row_generate_.get_schema().get_column_count(),
|
|
row_generate_.get_schema().get_rowkey_column_num(),
|
|
lib::is_oracle_mode(),
|
|
col_descs_));
|
|
|
|
ctx_.micro_block_size_ = 1L << 20; // 1MB, maximum micro block size;
|
|
ctx_.macro_block_size_ = 2L << 20;
|
|
ctx_.rowkey_column_cnt_ = rowkey_cnt_;
|
|
ctx_.column_cnt_ = is_multi_version_row_ ? column_cnt_ + 2 : column_cnt_;
|
|
ctx_.col_descs_ = &col_descs_;
|
|
ctx_.major_working_cluster_version_=cal_version(3, 1, 0, 0);
|
|
ctx_.row_store_type_ = common::ENCODING_ROW_STORE;
|
|
}
|
|
|
|
static const int64_t test_encoder_overflow = 3;
|
|
static ObObjType test_encoder_over_col_types[3] = {ObIntType, ObTimestampTZType, ObTextType};
|
|
class TestEncoderOverFlow : public TestIColumnEncoder
|
|
{
|
|
public:
|
|
TestEncoderOverFlow()
|
|
{
|
|
rowkey_cnt_ = 1;
|
|
column_cnt_ = test_encoder_overflow;
|
|
col_types_ = reinterpret_cast<ObObjType *>(allocator_.alloc(sizeof(ObObjType) * column_cnt_));
|
|
for (int64_t i = 0; i < column_cnt_; ++i) {
|
|
col_types_[i] = test_encoder_over_col_types[i];
|
|
}
|
|
}
|
|
virtual ~TestEncoderOverFlow()
|
|
{
|
|
allocator_.free(col_types_);
|
|
}
|
|
};
|
|
|
|
TEST_F(TestEncoderOverFlow, test_append_row_with_timestamp_and_max_estimate_limit)
|
|
{
|
|
common::ObClusterVersion::get_instance().update_cluster_version(cal_version(2, 2, 0, 75));
|
|
ObMicroBlockEncoder encoder;
|
|
ASSERT_EQ(OB_SUCCESS, encoder.init(ctx_));
|
|
|
|
encoder.estimate_size_limit_ = ctx_.macro_block_size_;
|
|
|
|
ObDatumRow row;
|
|
ASSERT_EQ(OB_SUCCESS, row.init(allocator_, column_cnt_));
|
|
int ret = OB_SUCCESS;
|
|
int row_cnt = 0;
|
|
// calculated max size 4444 for this schema
|
|
while(row_cnt < 4443) {
|
|
ASSERT_EQ(OB_SUCCESS, row_generate_.get_next_row(row));
|
|
ret = encoder.append_row(row);
|
|
row_cnt++;
|
|
}
|
|
ASSERT_EQ(OB_SUCCESS, row_generate_.get_next_row(row));
|
|
row.storage_datums_[2].len_ = 105000;
|
|
encoder.append_row(row);
|
|
|
|
LOG_INFO("Data buffer size", K(encoder.data_buffer_),
|
|
K(row_cnt), K(encoder.estimate_size_limit_), K(encoder.estimate_size_),
|
|
K(encoder.length_));
|
|
|
|
char *buf = NULL;
|
|
int64_t size = 0;
|
|
ASSERT_EQ(OB_SUCCESS, encoder.build_block(buf, size));
|
|
}
|
|
|
|
static ObObjType test_dict_large_varchar[2] = {ObIntType, ObVarcharType};
|
|
class TestDictLargeVarchar : public TestIColumnEncoder
|
|
{
|
|
public:
|
|
TestDictLargeVarchar() : TestIColumnEncoder(true)
|
|
{
|
|
rowkey_cnt_ = 1;
|
|
column_cnt_ = 2;
|
|
col_types_ = reinterpret_cast<ObObjType *>(allocator_.alloc(sizeof(ObObjType) * column_cnt_));
|
|
for (int64_t i = 0; i < column_cnt_; ++i) {
|
|
col_types_[i] = test_dict_large_varchar[i];
|
|
}
|
|
}
|
|
virtual ~TestDictLargeVarchar()
|
|
{
|
|
allocator_.free(col_types_);
|
|
}
|
|
|
|
int64_t full_column_cnt_ = 4;
|
|
};
|
|
|
|
TEST_F(TestDictLargeVarchar, test_dict_large_varchar)
|
|
{
|
|
ctx_.column_encodings_ = static_cast<int64_t *>(allocator_.alloc(sizeof(int64_t) * full_column_cnt_));
|
|
for (int64_t i = 0; i < full_column_cnt_; ++i) {
|
|
ctx_.column_encodings_[i] = ObColumnHeader::Type::DICT;
|
|
}
|
|
ObMicroBlockEncoder encoder;
|
|
ASSERT_EQ(OB_SUCCESS, encoder.init(ctx_));
|
|
|
|
ObDatumRow row;
|
|
ASSERT_EQ(OB_SUCCESS, row.init(allocator_, full_column_cnt_));
|
|
const int64_t varchar_data_size = UINT16_MAX * 2 + 1;
|
|
char *varchar_data = static_cast<char *>(allocator_.alloc(varchar_data_size));
|
|
ASSERT_TRUE(nullptr != varchar_data);
|
|
MEMSET(varchar_data, 7, varchar_data_size);
|
|
row.storage_datums_[0].set_int(1);
|
|
row.storage_datums_[3].set_string(varchar_data, varchar_data_size);
|
|
|
|
ASSERT_EQ(OB_SUCCESS, encoder.append_row(row));
|
|
|
|
char *buf = nullptr;
|
|
int64_t size = 0;
|
|
ASSERT_EQ(OB_SUCCESS, encoder.build_block(buf, size));
|
|
|
|
ObMicroBlockData micro_data(buf, size);
|
|
ObMicroBlockDecoder decoder;
|
|
ObDatumRow read_row;
|
|
ASSERT_EQ(OB_SUCCESS, read_row.init(full_column_cnt_));
|
|
ASSERT_EQ(OB_SUCCESS, decoder.init(micro_data, nullptr));
|
|
ASSERT_EQ(OB_SUCCESS, decoder.get_row(0, read_row));
|
|
STORAGE_LOG(DEBUG, "read row", K(read_row));
|
|
|
|
ASSERT_EQ(row.storage_datums_[3].len_, read_row.storage_datums_[3].len_);
|
|
ASSERT_TRUE(ObDatum::binary_equal(row.storage_datums_[3], read_row.storage_datums_[3]));
|
|
}
|
|
|
|
|
|
static ObObjType test_column_equal_exception_list[3] = {ObIntType, ObVarcharType, ObVarcharType};
|
|
class TestColumnEqualExceptionList : public TestIColumnEncoder
|
|
{
|
|
public:
|
|
TestColumnEqualExceptionList()
|
|
{
|
|
rowkey_cnt_ = 1;
|
|
column_cnt_ = 3;
|
|
col_types_ = reinterpret_cast<ObObjType *>(allocator_.alloc(sizeof(ObObjType) * column_cnt_));
|
|
for (int64_t i = 0; i < column_cnt_; ++i) {
|
|
col_types_[i] = test_column_equal_exception_list[i];
|
|
}
|
|
}
|
|
virtual ~TestColumnEqualExceptionList()
|
|
{
|
|
allocator_.free(col_types_);
|
|
}
|
|
};
|
|
|
|
TEST_F(TestColumnEqualExceptionList, test_column_equal_ext_offset_overflow)
|
|
{
|
|
const int64_t fixed_varchar_len = 1024;
|
|
char *fixed_varchar = static_cast<char *>(allocator_.alloc(fixed_varchar_len));
|
|
const int64_t diff_varchar_len = 16384; // 16kB
|
|
char *diff_varchar1 = static_cast<char *>(allocator_.alloc(diff_varchar_len));
|
|
char *diff_varchar2 = static_cast<char *>(allocator_.alloc(diff_varchar_len));
|
|
ASSERT_NE(diff_varchar1, nullptr);
|
|
ASSERT_NE(diff_varchar2, nullptr);
|
|
MEMSET(diff_varchar1, 0, diff_varchar_len);
|
|
MEMSET(diff_varchar2, 1, diff_varchar_len);
|
|
|
|
ObMicroBlockEncoder encoder;
|
|
ctx_.micro_block_size_ = 1 << 20; // 1MB
|
|
ASSERT_EQ(OB_SUCCESS, encoder.init(ctx_));
|
|
encoder.estimate_size_limit_ = ctx_.macro_block_size_;
|
|
encoder.set_micro_block_merge_verify_level(MICRO_BLOCK_MERGE_VERIFY_LEVEL::ENCODING_AND_COMPRESSION);
|
|
|
|
ObDatumRow row;
|
|
ASSERT_EQ(OB_SUCCESS, row.init(allocator_, column_cnt_));
|
|
|
|
int64_t row_cnt = 0;
|
|
for (int64_t i = 0; i < 200; ++i) {
|
|
MEMSET(fixed_varchar, i, fixed_varchar_len);
|
|
row.storage_datums_[0].set_int(1);
|
|
row.storage_datums_[1].set_string(fixed_varchar, fixed_varchar_len);
|
|
row.storage_datums_[2].set_string(fixed_varchar, fixed_varchar_len);
|
|
ASSERT_EQ(OB_SUCCESS, encoder.append_row(row));
|
|
++row_cnt;
|
|
}
|
|
|
|
for (int64_t i = 0; i < 8; ++i) {
|
|
MEMSET(diff_varchar1, i, diff_varchar_len);
|
|
MEMSET(diff_varchar2, 16 + i, diff_varchar_len);
|
|
row.storage_datums_[0].set_int(2);
|
|
row.storage_datums_[1].set_string(diff_varchar1, diff_varchar_len - i);
|
|
row.storage_datums_[2].set_string(diff_varchar2, diff_varchar_len - i);
|
|
ASSERT_EQ(OB_SUCCESS, encoder.append_row(row));
|
|
++row_cnt;
|
|
}
|
|
|
|
ASSERT_EQ(row_cnt, encoder.get_row_count());
|
|
const int64_t encoder_checksum = encoder.get_micro_block_checksum();
|
|
|
|
STORAGE_LOG(INFO, "before build block", K(encoder_checksum), K(row_cnt), K(encoder.get_row_count()));
|
|
|
|
char *buf = nullptr;
|
|
int64_t size = 0;
|
|
ASSERT_EQ(OB_SUCCESS, encoder.build_block(buf, size));
|
|
STORAGE_LOG(INFO, "after build block", KPC(encoder.encoders_[0]), KPC(encoder.encoders_[1]), KPC(encoder.encoders_[2]));
|
|
ASSERT_EQ(encoder.encoders_[1]->get_type(), ObColumnHeader::COLUMN_EQUAL);
|
|
ObColumnEqualEncoder *ce_encoder = static_cast<ObColumnEqualEncoder *>(encoder.encoders_[1]);
|
|
ASSERT_EQ(true, ce_encoder->base_meta_writer_.meta_.is_var_exc());
|
|
|
|
// decode and checksum
|
|
ObMicroBlockData micro_data(buf, size);
|
|
ObMicroBlockDecoder decoder;
|
|
ObDatumRow read_row;
|
|
ASSERT_EQ(OB_SUCCESS, read_row.init(column_cnt_));
|
|
ASSERT_EQ(OB_SUCCESS, decoder.init(micro_data, nullptr));
|
|
|
|
int64_t new_checksum = 0;
|
|
for (int64_t i = 0; i < row_cnt; ++i) {
|
|
ASSERT_EQ(OB_SUCCESS, decoder.get_row(i, read_row));
|
|
STORAGE_LOG(DEBUG, "read row", K(read_row));
|
|
for (int64_t j = 0; j < column_cnt_; ++j) {
|
|
const bool is_invalid_datum = (read_row.storage_datums_[j].is_null() && read_row.storage_datums_[j].len_ != 0);
|
|
ASSERT_EQ(false, is_invalid_datum);
|
|
}
|
|
new_checksum = ObIMicroBlockWriter::cal_row_checksum(read_row, new_checksum);
|
|
}
|
|
ASSERT_EQ(new_checksum, encoder_checksum);
|
|
|
|
|
|
}
|
|
|
|
class TestEncodingRowBufHolder : public ::testing::Test
|
|
{
|
|
public:
|
|
TestEncodingRowBufHolder() {}
|
|
virtual ~TestEncodingRowBufHolder() {}
|
|
virtual void SetUp() {}
|
|
virtual void TearDown() {}
|
|
};
|
|
|
|
TEST_F(TestEncodingRowBufHolder, test_encoding_row_buf_holder)
|
|
{
|
|
ObEncodingRowBufHolder buf_holder;
|
|
ASSERT_EQ(OB_NOT_INIT, buf_holder.try_alloc(12345));
|
|
ASSERT_EQ(OB_SUCCESS, buf_holder.init(OB_DEFAULT_MACRO_BLOCK_SIZE));
|
|
ASSERT_EQ(OB_INVALID_ARGUMENT, buf_holder.try_alloc(4 * OB_DEFAULT_MACRO_BLOCK_SIZE));
|
|
const char *test_mark = "fly me to the moon";
|
|
|
|
const int test_mark_len = strlen(test_mark);
|
|
const int64_t first_alloc_size = 4096;
|
|
const int64_t snd_alloc_size = static_cast<int64_t>(first_alloc_size * 1.2);
|
|
const int64_t trd_alloc_size = first_alloc_size * 10;
|
|
ASSERT_EQ(OB_SUCCESS, buf_holder.try_alloc(first_alloc_size));
|
|
MEMCPY(buf_holder.get_buf(), test_mark, test_mark_len);
|
|
const char *first_alloc_buf = buf_holder.get_buf();
|
|
|
|
ASSERT_EQ(OB_SUCCESS, buf_holder.try_alloc(snd_alloc_size));
|
|
ASSERT_EQ(first_alloc_buf, buf_holder.get_buf());
|
|
int cmp_ret = MEMCMP(test_mark, buf_holder.get_buf(), test_mark_len);
|
|
ASSERT_EQ(cmp_ret, 0);
|
|
ASSERT_EQ(buf_holder.alloc_size_, first_alloc_size * ObEncodingRowBufHolder::EXTRA_MEM_FACTOR);
|
|
|
|
ASSERT_EQ(OB_SUCCESS, buf_holder.try_alloc(trd_alloc_size));
|
|
ASSERT_EQ(buf_holder.alloc_size_, trd_alloc_size * ObEncodingRowBufHolder::EXTRA_MEM_FACTOR);
|
|
|
|
buf_holder.reset();
|
|
ASSERT_EQ(buf_holder.allocator_.arena_.used_, 0);
|
|
}
|
|
|
|
}
|
|
}
|
|
|
|
int main(int argc, char **argv)
|
|
{
|
|
system("rm -f test_micro_block_encoder.log*");
|
|
OB_LOGGER.set_file_name("test_micro_block_encoder.log");
|
|
oceanbase::common::ObLogger::get_logger().set_log_level("INFO");
|
|
testing::InitGoogleTest(&argc, argv);
|
|
return RUN_ALL_TESTS();
|
|
}
|