Files
doris/be/test/olap/row_block_test.cpp
chenhao7253886 37b4cafe87 Change variable and namespace name in BE (#268)
Change 'palo' to 'doris'
2018-11-02 10:22:32 +08:00

810 lines
24 KiB
C++

// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
#include <gtest/gtest.h>
#include <sstream>
#include "common/object_pool.h"
#include "exprs/expr.h"
#include "exprs/expr_context.h"
#include "olap/row_block.h"
#include "olap/olap_table.h"
#include "runtime/runtime_state.h"
#include "util/debug_util.h"
#include "util/logging.h"
using std::vector;
using std::string;
using std::endl;
using std::stringstream;
namespace doris {
class TestRowBlock : public testing::Test {
public:
TestRowBlock() {}
void SetUp() {
}
void TearDown() {
}
void SetRows(RowBlock& row_block) {
}
};
TEST_F(TestRowBlock, init) {
std::vector<FieldInfo> fields;
{
// k1: bigint
{
FieldInfo info;
info.name = "k1";
info.type = OLAP_FIELD_TYPE_BIGINT;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 8;
info.is_key = true;
fields.push_back(info);
}
// k2: char
{
FieldInfo info;
info.name = "k2";
info.type = OLAP_FIELD_TYPE_CHAR;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 10;
info.is_key = true;
fields.push_back(info);
}
// k3: varchar
{
FieldInfo info;
info.name = "k3";
info.type = OLAP_FIELD_TYPE_VARCHAR;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 20;
info.is_key = true;
fields.push_back(info);
}
}
{
// has nullbyte
RowBlock block(fields);
RowBlockInfo block_info;
block_info.row_num = 1024;
block_info.data_file_type = OLAP_DATA_FILE;
block_info.null_supported = true;
auto res = block.init(block_info);
ASSERT_EQ(OLAP_SUCCESS, res);
// num_rows * (num_nullbytes + bigint + char + varchar)
ASSERT_EQ(1024 * (3 + 8 + 10 + (4 + 20)), block.buf_len());
}
{
// has nullbyte
RowBlock block(fields);
RowBlockInfo block_info;
block_info.row_num = 1024;
block_info.data_file_type = OLAP_DATA_FILE;
block_info.null_supported = false;
auto res = block.init(block_info);
ASSERT_EQ(OLAP_SUCCESS, res);
// num_rows * (num_nullbytes + bigint + char + varchar)
ASSERT_EQ(1024 * (8 + 10 + (4 + 20)), block.buf_len());
}
}
TEST_F(TestRowBlock, write_and_read) {
std::vector<FieldInfo> fields;
{
// k1: bigint
{
FieldInfo info;
info.name = "k1";
info.type = OLAP_FIELD_TYPE_BIGINT;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 8;
info.is_key = true;
fields.push_back(info);
}
// k2: char
{
FieldInfo info;
info.name = "k2";
info.type = OLAP_FIELD_TYPE_CHAR;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 10;
info.is_key = true;
fields.push_back(info);
}
// k3: varchar
{
FieldInfo info;
info.name = "k3";
info.type = OLAP_FIELD_TYPE_VARCHAR;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 20;
info.is_key = true;
fields.push_back(info);
}
}
//
RowBlock block(fields);
RowBlockInfo block_info;
block_info.row_num = 1024;
block_info.data_file_type = OLAP_DATA_FILE;
block_info.null_supported = true;
auto res = block.init(block_info);
ASSERT_EQ(OLAP_SUCCESS, res);
RowCursor row;
row.init(fields);
for (int i = 0; i < 5; ++i) {
block.get_row(i, &row);
// bigint
{
int64_t val = i;
row.set_not_null(0);
row.set_field_content(0, (const char*)&val, block.mem_pool());
}
// char
{
char buf[10];
memset(buf, 'a' + i, 10);
StringSlice val(buf, 10);
row.set_not_null(1);
row.set_field_content(1, (const char*)&val, block.mem_pool());
}
// varchar
{
char buf[10];
memset(buf, '0' + i, 10);
StringSlice val(buf, 10);
row.set_not_null(2);
row.set_field_content(2, (const char*)&val, block.mem_pool());
}
}
block.finalize(5);
ASSERT_EQ(5, block.row_num());
char serialized_buf[2048];
size_t written_len = 0;
res = block.serialize_to_row_format(serialized_buf, 2048, &written_len, OLAP_COMP_STORAGE);
ASSERT_EQ(OLAP_SUCCESS, res);
{
RowBlock resolve_block(fields);
block_info.checksum = block.row_block_info().checksum;
block_info.row_num = 5;
res = resolve_block.init(block_info);
ASSERT_EQ(OLAP_SUCCESS, res);
res = resolve_block.decompress(serialized_buf, written_len, OLAP_COMP_STORAGE);
ASSERT_EQ(OLAP_SUCCESS, res);
ASSERT_EQ(5, resolve_block.row_num());
for (int i = 0; i < 5; ++i) {
resolve_block.get_row(i, &row);
{
ASSERT_FALSE(row.is_null(0));
ASSERT_EQ(i, *(int64_t*)row.get_field_content_ptr(0));
}
{
ASSERT_FALSE(row.is_null(1));
StringSlice* slice = (StringSlice*)row.get_field_content_ptr(1);
char buf[10];
memset(buf, 'a' + i, 10);
ASSERT_EQ(10, slice->size);
ASSERT_EQ(0, memcmp(buf, slice->data, 10));
}
{
ASSERT_FALSE(row.is_null(2));
StringSlice* slice = (StringSlice*)row.get_field_content_ptr(2);
char buf[20];
memset(buf, '0' + i, 10);
ASSERT_EQ(10, slice->size);
ASSERT_EQ(0, memcmp(buf, slice->data, 10));
}
}
}
}
TEST_F(TestRowBlock, write_and_read_without_nullbyte) {
std::vector<FieldInfo> fields;
{
// k1: bigint
{
FieldInfo info;
info.name = "k1";
info.type = OLAP_FIELD_TYPE_BIGINT;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 8;
info.is_key = true;
fields.push_back(info);
}
// k2: char
{
FieldInfo info;
info.name = "k2";
info.type = OLAP_FIELD_TYPE_CHAR;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 10;
info.is_key = true;
fields.push_back(info);
}
// k3: varchar
{
FieldInfo info;
info.name = "k3";
info.type = OLAP_FIELD_TYPE_VARCHAR;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 20;
info.is_key = true;
fields.push_back(info);
}
}
//
RowBlock block(fields);
RowBlockInfo block_info;
block_info.row_num = 1024;
block_info.data_file_type = OLAP_DATA_FILE;
block_info.null_supported = false;
auto res = block.init(block_info);
ASSERT_EQ(OLAP_SUCCESS, res);
RowCursor row;
row.init(fields);
for (int i = 0; i < 5; ++i) {
block.get_row(i, &row);
// bigint
{
int64_t val = i;
row.set_not_null(0);
row.set_field_content(0, (const char*)&val, block.mem_pool());
}
// char
{
char buf[10];
memset(buf, 'a' + i, 10);
StringSlice val(buf, 10);
row.set_not_null(1);
row.set_field_content(1, (const char*)&val, block.mem_pool());
}
// varchar
{
char buf[10];
memset(buf, '0' + i, 10);
StringSlice val(buf, 10);
row.set_not_null(2);
row.set_field_content(2, (const char*)&val, block.mem_pool());
}
}
block.finalize(5);
ASSERT_EQ(5, block.row_num());
char serialized_buf[2048];
size_t written_len = 0;
res = block.serialize_to_row_format(serialized_buf, 2048, &written_len, OLAP_COMP_STORAGE);
ASSERT_EQ(OLAP_SUCCESS, res);
{
RowBlock resolve_block(fields);
block_info.checksum = block.row_block_info().checksum;
block_info.row_num = 5;
res = resolve_block.init(block_info);
ASSERT_EQ(OLAP_SUCCESS, res);
res = resolve_block.decompress(serialized_buf, written_len, OLAP_COMP_STORAGE);
ASSERT_EQ(OLAP_SUCCESS, res);
ASSERT_EQ(5, resolve_block.row_num());
for (int i = 0; i < 5; ++i) {
resolve_block.get_row(i, &row);
{
ASSERT_FALSE(row.is_null(0));
ASSERT_EQ(i, *(int64_t*)row.get_field_content_ptr(0));
}
{
ASSERT_FALSE(row.is_null(1));
StringSlice* slice = (StringSlice*)row.get_field_content_ptr(1);
char buf[10];
memset(buf, 'a' + i, 10);
ASSERT_EQ(10, slice->size);
ASSERT_EQ(0, memcmp(buf, slice->data, 10));
}
{
ASSERT_FALSE(row.is_null(2));
StringSlice* slice = (StringSlice*)row.get_field_content_ptr(2);
char buf[20];
memset(buf, '0' + i, 10);
ASSERT_EQ(10, slice->size);
ASSERT_EQ(0, memcmp(buf, slice->data, 10));
}
}
}
}
TEST_F(TestRowBlock, compress_failed) {
std::vector<FieldInfo> fields;
{
// k1: bigint
{
FieldInfo info;
info.name = "k1";
info.type = OLAP_FIELD_TYPE_BIGINT;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 8;
info.is_key = true;
fields.push_back(info);
}
// k2: char
{
FieldInfo info;
info.name = "k2";
info.type = OLAP_FIELD_TYPE_CHAR;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 10;
info.is_key = true;
fields.push_back(info);
}
// k3: varchar
{
FieldInfo info;
info.name = "k3";
info.type = OLAP_FIELD_TYPE_VARCHAR;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 20;
info.is_key = true;
fields.push_back(info);
}
}
//
RowBlock block(fields);
RowBlockInfo block_info;
block_info.row_num = 1024;
block_info.data_file_type = OLAP_DATA_FILE;
block_info.null_supported = true;
auto res = block.init(block_info);
ASSERT_EQ(OLAP_SUCCESS, res);
RowCursor row;
row.init(fields);
for (int i = 0; i < 5; ++i) {
block.get_row(i, &row);
// bigint
{
int64_t val = i;
row.set_field_content(0, (const char*)&val, block.mem_pool());
}
// char
{
char buf[10];
memset(buf, 'a' + i, 10);
StringSlice val(buf, 10);
row.set_field_content(1, (const char*)&val, block.mem_pool());
}
// varchar
{
char buf[10];
memset(buf, '0' + i, 10);
StringSlice val(buf, 10);
row.set_field_content(2, (const char*)&val, block.mem_pool());
}
}
block.finalize(5);
ASSERT_EQ(5, block.row_num());
char serialized_buf[2048];
size_t written_len = 0;
res = block.serialize_to_row_format(serialized_buf, 1, &written_len, OLAP_COMP_STORAGE);
ASSERT_NE(OLAP_SUCCESS, res);
}
TEST_F(TestRowBlock, decompress_failed) {
std::vector<FieldInfo> fields;
{
// k1: bigint
{
FieldInfo info;
info.name = "k1";
info.type = OLAP_FIELD_TYPE_BIGINT;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 8;
info.is_key = true;
fields.push_back(info);
}
// k2: char
{
FieldInfo info;
info.name = "k2";
info.type = OLAP_FIELD_TYPE_CHAR;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 10;
info.is_key = true;
fields.push_back(info);
}
// k3: varchar
{
FieldInfo info;
info.name = "k3";
info.type = OLAP_FIELD_TYPE_VARCHAR;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 20;
info.is_key = true;
fields.push_back(info);
}
}
//
RowBlock block(fields);
RowBlockInfo block_info;
block_info.row_num = 1024;
block_info.data_file_type = OLAP_DATA_FILE;
block_info.null_supported = true;
auto res = block.init(block_info);
ASSERT_EQ(OLAP_SUCCESS, res);
RowCursor row;
row.init(fields);
for (int i = 0; i < 5; ++i) {
block.get_row(i, &row);
// bigint
{
int64_t val = i;
row.set_field_content(0, (const char*)&val, block.mem_pool());
}
// char
{
char buf[10];
memset(buf, 'a' + i, 10);
StringSlice val(buf, 10);
row.set_field_content(1, (const char*)&val, block.mem_pool());
}
// varchar
{
char buf[10];
memset(buf, '0' + i, 10);
StringSlice val(buf, 10);
row.set_field_content(2, (const char*)&val, block.mem_pool());
}
}
block.finalize(5);
ASSERT_EQ(5, block.row_num());
char serialized_buf[2048];
size_t written_len = 0;
res = block.serialize_to_row_format(serialized_buf, 2048, &written_len, OLAP_COMP_STORAGE);
ASSERT_EQ(OLAP_SUCCESS, res);
{
// checksum failed
RowBlock resolve_block(fields);
block_info.checksum = 0;
block_info.row_num = 5;
res = resolve_block.init(block_info);
ASSERT_EQ(OLAP_SUCCESS, res);
res = resolve_block.decompress(serialized_buf, written_len, OLAP_COMP_STORAGE);
ASSERT_NE(OLAP_SUCCESS, res);
}
{
// buffer is not ok
RowBlock resolve_block(fields);
block_info.checksum = block.row_block_info().checksum;
block_info.row_num = 5;
res = resolve_block.init(block_info);
ASSERT_EQ(OLAP_SUCCESS, res);
res = resolve_block.decompress(serialized_buf, written_len - 1, OLAP_COMP_STORAGE);
ASSERT_NE(OLAP_SUCCESS, res);
}
}
TEST_F(TestRowBlock, find_row) {
std::vector<FieldInfo> fields;
{
// k1: bigint
{
FieldInfo info;
info.name = "k1";
info.type = OLAP_FIELD_TYPE_BIGINT;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 8;
info.is_key = true;
fields.push_back(info);
}
// k2: char
{
FieldInfo info;
info.name = "k2";
info.type = OLAP_FIELD_TYPE_CHAR;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 10;
info.is_key = true;
fields.push_back(info);
}
// k3: varchar
{
FieldInfo info;
info.name = "k3";
info.type = OLAP_FIELD_TYPE_VARCHAR;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 20;
info.is_key = true;
fields.push_back(info);
}
}
//
RowBlock block(fields);
RowBlockInfo block_info;
block_info.row_num = 1024;
block_info.data_file_type = OLAP_DATA_FILE;
block_info.null_supported = true;
auto res = block.init(block_info);
ASSERT_EQ(OLAP_SUCCESS, res);
RowCursor row;
row.init(fields);
for (int i = 0; i < 5; ++i) {
block.get_row(i, &row);
// bigint
{
int64_t val = i;
row.set_not_null(0);
row.set_field_content(0, (const char*)&val, block.mem_pool());
}
// char
{
char buf[10];
memset(buf, 'a' + i, 10);
StringSlice val(buf, 10);
row.set_not_null(1);
row.set_field_content(1, (const char*)&val, block.mem_pool());
}
// varchar
{
char buf[10];
memset(buf, '0' + i, 10);
StringSlice val(buf, 10);
row.set_not_null(2);
row.set_field_content(2, (const char*)&val, block.mem_pool());
}
}
block.finalize(5);
ASSERT_EQ(5, block.row_num());
{
RowCursor find_row;
find_row.init(fields);
for (int i = 0; i < 5; ++i) {
// bigint
{
int64_t val = i;
find_row.set_not_null(0);
find_row.set_field_content(0, (const char*)&val, block.mem_pool());
}
// char
{
char buf[10];
memset(buf, 'a' + i, 10);
StringSlice val(buf, 10);
find_row.set_not_null(1);
find_row.set_field_content(1, (const char*)&val, block.mem_pool());
}
// varchar
{
char buf[10];
memset(buf, '0' + i, 10);
StringSlice val(buf, 10);
find_row.set_not_null(2);
find_row.set_field_content(2, (const char*)&val, block.mem_pool());
}
uint32_t row_index;
res = block.find_row(find_row, false, &row_index);
ASSERT_EQ(OLAP_SUCCESS, res);
ASSERT_EQ(i, row_index);
res = block.find_row(find_row, true, &row_index);
ASSERT_EQ(OLAP_SUCCESS, res);
ASSERT_EQ(i + 1, row_index);
}
{
// bigint
{
int64_t val = 1;
find_row.set_field_content(0, (const char*)&val, block.mem_pool());
}
// char
{
char buf[10];
memset(buf, 'c', 9);
StringSlice val(buf, 9);
find_row.set_field_content(1, (const char*)&val, block.mem_pool());
}
// varchar
{
char buf[10];
memset(buf, '0', 10);
StringSlice val(buf, 10);
find_row.set_field_content(2, (const char*)&val, block.mem_pool());
}
uint32_t row_index;
res = block.find_row(find_row, true, &row_index);
ASSERT_EQ(OLAP_SUCCESS, res);
ASSERT_EQ(2, row_index);
}
{
// bigint
{
int64_t val = -1;
find_row.set_field_content(0, (const char*)&val, block.mem_pool());
}
// char
{
char buf[10];
memset(buf, 'c', 9);
StringSlice val(buf, 9);
find_row.set_field_content(1, (const char*)&val, block.mem_pool());
}
// varchar
{
char buf[10];
memset(buf, '0', 10);
StringSlice val(buf, 10);
find_row.set_field_content(2, (const char*)&val, block.mem_pool());
}
uint32_t row_index;
res = block.find_row(find_row, true, &row_index);
ASSERT_EQ(OLAP_SUCCESS, res);
ASSERT_EQ(0, row_index);
}
}
}
TEST_F(TestRowBlock, clear) {
std::vector<FieldInfo> fields;
{
// k1: bigint
{
FieldInfo info;
info.name = "k1";
info.type = OLAP_FIELD_TYPE_BIGINT;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 8;
info.is_key = true;
fields.push_back(info);
}
// k2: char
{
FieldInfo info;
info.name = "k2";
info.type = OLAP_FIELD_TYPE_CHAR;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 10;
info.is_key = true;
fields.push_back(info);
}
// k3: varchar
{
FieldInfo info;
info.name = "k3";
info.type = OLAP_FIELD_TYPE_VARCHAR;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 20;
info.is_key = true;
fields.push_back(info);
}
}
//
RowBlock block(fields);
RowBlockInfo block_info;
block_info.row_num = 1024;
block_info.data_file_type = OLAP_DATA_FILE;
block_info.null_supported = true;
auto res = block.init(block_info);
ASSERT_EQ(OLAP_SUCCESS, res);
block.finalize(5);
ASSERT_EQ(5, block.row_num());
ASSERT_EQ(1024, block.capacity());
block.clear();
ASSERT_EQ(1024, block.row_num());
}
TEST_F(TestRowBlock, pos_limit) {
std::vector<FieldInfo> fields;
{
// k1: bigint
{
FieldInfo info;
info.name = "k1";
info.type = OLAP_FIELD_TYPE_BIGINT;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 8;
info.is_key = true;
fields.push_back(info);
}
// k2: char
{
FieldInfo info;
info.name = "k2";
info.type = OLAP_FIELD_TYPE_CHAR;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 10;
info.is_key = true;
fields.push_back(info);
}
// k3: varchar
{
FieldInfo info;
info.name = "k3";
info.type = OLAP_FIELD_TYPE_VARCHAR;
info.aggregation = OLAP_FIELD_AGGREGATION_NONE;
info.length = 20;
info.is_key = true;
fields.push_back(info);
}
}
//
RowBlock block(fields);
RowBlockInfo block_info;
block_info.row_num = 1024;
block_info.data_file_type = OLAP_DATA_FILE;
block_info.null_supported = true;
auto res = block.init(block_info);
ASSERT_EQ(OLAP_SUCCESS, res);
// assert init value
ASSERT_EQ(0, block.pos());
ASSERT_EQ(0, block.limit());
ASSERT_FALSE(block.has_remaining());
ASSERT_EQ(DEL_PARTIAL_SATISFIED, block.block_status());
block.set_limit(100);
ASSERT_EQ(100, block.limit());
ASSERT_TRUE(block.has_remaining());
ASSERT_EQ(100, block.remaining());
block.set_pos(2);
ASSERT_TRUE(block.has_remaining());
ASSERT_EQ(98, block.remaining());
block.pos_inc();
ASSERT_TRUE(block.has_remaining());
ASSERT_EQ(97, block.remaining());
block.set_block_status(DEL_SATISFIED);
ASSERT_EQ(DEL_SATISFIED, block.block_status());
}
}
// @brief Test Stub
int main(int argc, char** argv) {
std::string conffile = std::string(getenv("DORIS_HOME")) + "/conf/be.conf";
if (!doris::config::init(conffile.c_str(), false)) {
fprintf(stderr, "error read config file. \n");
return -1;
}
doris::init_glog("be-test");
int ret = doris::OLAP_SUCCESS;
testing::InitGoogleTest(&argc, argv);
ret = RUN_ALL_TESTS();
return ret;
}