Files
oceanbase/unittest/storage/blocksstable/test_micro_block_writer.cpp

294 lines
10 KiB
C++

/**
* Copyright (c) 2021 OceanBase
* OceanBase CE is licensed under Mulan PubL v2.
* You can use this software according to the terms and conditions of the Mulan PubL v2.
* You may obtain a copy of Mulan PubL v2 at:
* http://license.coscl.org.cn/MulanPubL-2.0
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
* See the Mulan PubL v2 for more details.
*/
#include <gtest/gtest.h>
#define private public
#define protected public
#include "storage/blocksstable/ob_micro_block_writer.h"
#include "storage/blocksstable/ob_micro_block_reader.h"
#include "ob_row_generate.h"
namespace oceanbase
{
using namespace common;
using namespace blocksstable;
using namespace storage;
using namespace share::schema;
namespace unittest
{
class TestMicroBlockWriter : public ::testing::Test
{
public:
static const int64_t rowkey_column_count = 2;
// Every ObObjType from ObTinyIntType to ObHexStringType inclusive.
// Skip ObNullType and ObExtendType because for external usage, a column type
// can't be NULL or NOP.
static const int64_t column_num = ObHexStringType;
static const int64_t macro_block_size = 2L * 1024 * 1024L;
static const int64_t SNAPSHOT_VERSION = 2;
public:
TestMicroBlockWriter() : allocator_(ObModIds::TEST), read_info_() {};
void SetUp();
virtual void TearDown() {}
void test_alloc(char *&ptr, const int64_t size);
protected:
ObRowGenerate row_generate_;
ObArenaAllocator allocator_;
ObTableReadInfo read_info_;
};
static void convert_to_multi_version_row(const ObDatumRow &org_row,
const ObTableSchema &schema, const int64_t snapshot_version,
ObDatumRow &multi_row)
{
int64_t rowkey_column_count = schema.get_rowkey_column_num();
for (int64_t i = 0; i < schema.get_column_count(); ++i) {
if (i < rowkey_column_count) {
multi_row.storage_datums_[i] = org_row.storage_datums_[i];
} else {
multi_row.storage_datums_[i + 2] = org_row.storage_datums_[i];
}
}
multi_row.storage_datums_[schema.get_rowkey_column_num()].set_int(-snapshot_version);
multi_row.storage_datums_[schema.get_rowkey_column_num() + 1].set_int(0);
multi_row.row_flag_= org_row.row_flag_;
}
void TestMicroBlockWriter::test_alloc(char *&ptr, const int64_t size)
{
ptr = reinterpret_cast<char*>(allocator_.alloc(size));
ASSERT_TRUE(nullptr != ptr);
}
void TestMicroBlockWriter::SetUp()
{
oceanbase::ObClusterVersion::get_instance().update_data_version(DATA_CURRENT_VERSION);
const int64_t table_id = 3001;
ObTableSchema table_schema;
ObColumnSchemaV2 column;
//init table schema
table_schema.reset();
ASSERT_EQ(OB_SUCCESS, table_schema.set_table_name("test_row_writer"));
table_schema.set_tenant_id(1);
table_schema.set_tablegroup_id(1);
table_schema.set_database_id(1);
table_schema.set_table_id(table_id);
table_schema.set_rowkey_column_num(rowkey_column_count);
table_schema.set_max_used_column_id(column_num);
//init column
char name[OB_MAX_FILE_NAME_LENGTH];
memset(name, 0, sizeof(name));
for(int64_t i = 0; i < column_num; ++i){
ObObjType obj_type = static_cast<ObObjType>(i + 1);
column.reset();
column.set_collation_type(CS_TYPE_BINARY);
column.set_table_id(table_id);
column.set_column_id(i + OB_APP_MIN_COLUMN_ID);
sprintf(name, "test%020ld", i);
ASSERT_EQ(OB_SUCCESS, column.set_column_name(name));
column.set_data_type(obj_type);
if(obj_type == common::ObIntType){
column.set_rowkey_position(1);
} else if (obj_type == common::ObNumberType){
column.set_rowkey_position(2);
} else {
column.set_rowkey_position(0);
}
column.set_collation_type(ObCollationType::CS_TYPE_UTF8MB4_GENERAL_CI);
ASSERT_EQ(OB_SUCCESS, table_schema.add_column(column));
}
//init ObRowGenerate
ASSERT_EQ(OB_SUCCESS, row_generate_.init(table_schema));
}
TEST_F(TestMicroBlockWriter, test_init)
{
int ret = OB_SUCCESS;
ObMicroBlockWriter writer;
writer.data_buffer_.allocator_.set_tenant_id(500);
writer.index_buffer_.allocator_.set_tenant_id(500);
//invalid macro_block_size
ret = writer.init(0, 2, 5);
ASSERT_EQ(OB_INVALID_ARGUMENT, ret);
//invalid column_count
ret = writer.init(1024, 2, 0);
ASSERT_EQ(OB_INVALID_ARGUMENT, ret);
//invalid rowkey_column_count
ret = writer.init(1024, 6, 5);
ASSERT_EQ(OB_INVALID_ARGUMENT, ret);
//success
ret = writer.init(1024, 2, 5);
ASSERT_EQ(OB_SUCCESS, ret);
ASSERT_EQ(sizeof(ObMicroBlockHeader)+4, writer.get_block_size());
ASSERT_EQ(0, writer.get_row_count());
ASSERT_EQ(sizeof(ObMicroBlockHeader), writer.get_data_size());
}
TEST_F(TestMicroBlockWriter, append_success)
{
int ret = OB_SUCCESS;
const int64_t test_row_num = 100;
ObDatumRow row;
ASSERT_EQ(OB_SUCCESS, row.init(allocator_, column_num));
ObDatumRow multi_version_row;
ASSERT_EQ(OB_SUCCESS, multi_version_row.init(allocator_, column_num + 2));
ObMicroBlockWriter writer;
writer.data_buffer_.allocator_.set_tenant_id(500);
writer.index_buffer_.allocator_.set_tenant_id(500);
ret = writer.init(macro_block_size, rowkey_column_count, column_num + 2);
ASSERT_EQ(OB_SUCCESS, ret);
for(int64_t i = 0; i < test_row_num; ++i){
ASSERT_EQ(OB_SUCCESS, row_generate_.get_next_row(row));
convert_to_multi_version_row(row, row_generate_.get_schema(), SNAPSHOT_VERSION, multi_version_row);
ASSERT_EQ(OB_SUCCESS, writer.append_row(multi_version_row));
}
char *buf = NULL;
int64_t size = 0;
ret = writer.build_block(buf, size);
ASSERT_EQ(OB_SUCCESS, ret);
//check ObMicroBlockWriter right by ObMicroBlockReader and ObRowGenerate
ObArray<ObColDesc> columns;
ASSERT_EQ(OB_SUCCESS, row_generate_.get_schema().get_column_ids(columns));
ObTableReadInfo read_info;
ASSERT_EQ(OB_SUCCESS, read_info_.init(
allocator_, 16000, row_generate_.get_schema().get_rowkey_column_num(), lib::is_oracle_mode(), columns, nullptr/*storage_cols_index*/));
ObMicroBlockReader reader;
ObMicroBlockData block(buf, size);
ret = reader.init(block, read_info_);
ASSERT_EQ(OB_SUCCESS, ret);
ObDatumRow read_row;
ASSERT_EQ(OB_SUCCESS, read_row.init(allocator_, column_num));
for(int64_t i = 0; i < test_row_num; ++ i){
ASSERT_EQ(OB_SUCCESS, reader.get_row(i, read_row));
bool exist = false;
ASSERT_EQ(OB_SUCCESS, row_generate_.check_one_row(read_row, exist));
ASSERT_TRUE(exist) << "i: " << i;
//every obj should equal
ASSERT_EQ(OB_SUCCESS, row_generate_.get_next_row(i, row));
for (int64_t j = 0; j < column_num ; ++ j){
ObCStringHelper helper;
ASSERT_TRUE(read_row.storage_datums_[j] == row.storage_datums_[j])
<< "\n i: " << i << " j: " << j
<< "\n writer: "<< helper.convert(row.storage_datums_[j])
<< "\n reader: " << helper.convert(read_row.storage_datums_[j]);
}
}
}
TEST_F(TestMicroBlockWriter, append_row_error)
{
int ret = OB_SUCCESS;
ObDatumRow row;
ASSERT_EQ(OB_SUCCESS, row.init(allocator_, column_num));
ObDatumRow multi_version_row;
ASSERT_EQ(OB_SUCCESS, multi_version_row.init(allocator_, column_num + 2));
//not init
ObMicroBlockWriter writer;
writer.data_buffer_.allocator_.set_tenant_id(500);
writer.index_buffer_.allocator_.set_tenant_id(500);
ASSERT_EQ(OB_SUCCESS, row_generate_.get_next_row(row));
convert_to_multi_version_row(row, row_generate_.get_schema(), SNAPSHOT_VERSION, multi_version_row);
ASSERT_EQ(OB_NOT_INIT, writer.append_row(multi_version_row));
//column count not equal
ret = writer.init(macro_block_size, rowkey_column_count, column_num + 1);
ASSERT_EQ(OB_SUCCESS, ret);
ASSERT_EQ(OB_SUCCESS, row_generate_.get_next_row(row));
convert_to_multi_version_row(row, row_generate_.get_schema(), SNAPSHOT_VERSION, multi_version_row);
ASSERT_EQ(OB_INVALID_ARGUMENT, writer.append_row(multi_version_row));
//fail to write not support type
ret = writer.init(macro_block_size, rowkey_column_count, column_num + 2);
ASSERT_EQ(OB_SUCCESS, ret);
ASSERT_EQ(OB_SUCCESS, row_generate_.get_next_row(row));
}
TEST_F(TestMicroBlockWriter, build_block_error)
{
char *buf = NULL;
int64_t size = 0;
ObDatumRow row;
ASSERT_EQ(OB_SUCCESS, row.init(allocator_, column_num));
//not init
ObMicroBlockWriter writer;
writer.data_buffer_.allocator_.set_tenant_id(500);
writer.index_buffer_.allocator_.set_tenant_id(500);
ASSERT_EQ(OB_SUCCESS, row_generate_.get_next_row(row));
ASSERT_EQ(OB_NOT_INIT, writer.build_block(buf, size));
}
TEST_F(TestMicroBlockWriter, init_max_column_count)
{
// data_buffer_ and index_buffer_ in ObMicroBlockWriter should init succeed
ObMicroBlockWriter writer;
writer.data_buffer_.allocator_.set_tenant_id(500);
writer.index_buffer_.allocator_.set_tenant_id(500);
int64_t ret = writer.init(
common::OB_DEFAULT_MACRO_BLOCK_SIZE,
1,
common::OB_ROW_MAX_COLUMNS_COUNT
);
ASSERT_EQ(OB_SUCCESS, ret);
}
TEST_F(TestMicroBlockWriter, append_large_row)
{
// create a large row whose size is 1.5MB
int64_t large_row_col_cnt = 2;
ObDatumRow row;
ASSERT_EQ(OB_SUCCESS, row.init(allocator_, large_row_col_cnt));
row.row_flag_.set_flag(ObDmlFlag::DF_INSERT);
int32_t value1_size = 1024 * 1024;
char *ptr1 = nullptr;
test_alloc(ptr1, value1_size);
ASSERT_TRUE(nullptr != ptr1);
row.storage_datums_[0].set_string(ObString(value1_size, ptr1));
int32_t value2_size = 512 * 1024;
char *ptr2 = nullptr;
test_alloc(ptr2, value2_size);
row.storage_datums_[1].set_string(ObString(value2_size, ptr2));
ObMicroBlockWriter writer;
writer.data_buffer_.allocator_.set_tenant_id(500);
writer.index_buffer_.allocator_.set_tenant_id(500);
int64_t ret = writer.init(common::OB_DEFAULT_MACRO_BLOCK_SIZE, 1, large_row_col_cnt);
ASSERT_EQ(OB_SUCCESS, ret);
// append large row;
ret = writer.append_row(row);
ASSERT_EQ(OB_SUCCESS, ret);
}
}//end namespace unittest
}//end namespace oceanbase
int main(int argc, char **argv)
{
system("rm -rf test_micro_block_writer.log");
OB_LOGGER.set_file_name("test_micro_block_writer.log", true, true);
oceanbase::common::ObLogger::get_logger().set_log_level("INFO");
testing::InitGoogleTest(&argc, argv);
return RUN_ALL_TESTS();
}