[feature](vectorized) support vexplode_bitmap (#8890)

This commit is contained in:
Pxl
2022-04-08 09:20:26 +08:00
committed by GitHub
parent fa8e4ec2f0
commit dbbc6549bd
7 changed files with 142 additions and 7 deletions

View File

@ -33,13 +33,12 @@ public:
virtual Status forward(bool* eos) override;
private:
protected:
void _reset_iterator();
private:
// Read from tuple row.
// if _cur_bitmap_owned is true, need to delete it when deconstruction
BitmapValue* _cur_bitmap = nullptr;
const BitmapValue* _cur_bitmap = nullptr;
bool _cur_bitmap_owned = false;
// iterator of _cur_bitmap
BitmapValueIterator* _cur_iter = nullptr;

View File

@ -22,9 +22,10 @@
#include "exprs/table_function/explode_json_array.h"
#include "exprs/table_function/explode_split.h"
#include "exprs/table_function/table_function.h"
#include "vec/exprs/table_function/vexplode_bitmap.h"
#include "vec/exprs/table_function/vexplode_json_array.h"
#include "vec/exprs/table_function/vexplode_numbers.h"
#include "vec/exprs/table_function/vexplode_split.h"
#include "vec/exprs/table_function/vexplode_json_array.h"
namespace doris {
@ -36,13 +37,15 @@ struct TableFunctionCreator {
template <>
struct TableFunctionCreator<ExplodeJsonArrayTableFunction> {
ExplodeJsonArrayType type;
TableFunction* operator()() { return new ExplodeJsonArrayTableFunction(type); }
TableFunction* operator()() const { return new ExplodeJsonArrayTableFunction(type); }
};
template <>
struct TableFunctionCreator<vectorized::VExplodeJsonArrayTableFunction> {
ExplodeJsonArrayType type;
TableFunction* operator()() { return new vectorized::VExplodeJsonArrayTableFunction(type); }
TableFunction* operator()() const {
return new vectorized::VExplodeJsonArrayTableFunction(type);
}
};
inline auto ExplodeJsonArrayIntCreator =
@ -76,7 +79,9 @@ const std::unordered_map<std::pair<std::string, bool>, std::function<TableFuncti
TableFunctionCreator<vectorized::VExplodeNumbersTableFunction>()},
{{"explode_json_array_int", true}, VExplodeJsonArrayIntCreator},
{{"explode_json_array_double", true}, VExplodeJsonArrayDoubleCreator},
{{"explode_json_array_string", true}, VExplodeJsonArrayStringCreator}};
{{"explode_json_array_string", true}, VExplodeJsonArrayStringCreator},
{{"explode_bitmap", true},
TableFunctionCreator<vectorized::VExplodeBitmapTableFunction>()}};
Status TableFunctionFactory::get_fn(const std::string& fn_name, bool is_vectorized,
ObjectPool* pool, TableFunction** fn) {

View File

@ -113,6 +113,7 @@ set(VEC_FILES
exprs/vinfo_func.cpp
exprs/table_function/vexplode_split.cpp
exprs/table_function/vexplode_numbers.cpp
exprs/table_function/vexplode_bitmap.cpp
functions/array/function_array_index.cpp
functions/array/function_array_element.cpp
functions/array/function_array_register.cpp

View File

@ -0,0 +1,81 @@
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
#include "vec/exprs/table_function/vexplode_bitmap.h"
#include "util/bitmap_value.h"
#include "vec/exprs/vexpr.h"
namespace doris::vectorized {
VExplodeBitmapTableFunction::VExplodeBitmapTableFunction() {
_fn_name = "vexplode_bitmap";
}
Status VExplodeBitmapTableFunction::process_init(vectorized::Block* block) {
CHECK(_vexpr_context->root()->children().size() == 1)
<< "VExplodeNumbersTableFunction must be have 1 children but have "
<< _vexpr_context->root()->children().size();
int value_column_idx = -1;
_vexpr_context->root()->children()[0]->execute(_vexpr_context, block, &value_column_idx);
_value_column = block->get_by_position(value_column_idx).column;
return Status::OK();
}
Status VExplodeBitmapTableFunction::process_row(size_t row_idx) {
_eos = false;
_is_current_empty = false;
_cur_size = 0;
_cur_offset = 0;
StringRef value = _value_column->get_data_at(row_idx);
if (value.data == nullptr) {
_is_current_empty = true;
} else {
_cur_bitmap = reinterpret_cast<const BitmapValue*>(value.data);
_cur_bitmap_owned = false;
_cur_size = _cur_bitmap->cardinality();
if (_cur_size == 0) {
_is_current_empty = true;
} else {
_reset_iterator();
}
}
_is_current_empty = (_cur_size == 0);
return Status::OK();
}
Status VExplodeBitmapTableFunction::process_close() {
_value_column = nullptr;
return Status::OK();
}
Status VExplodeBitmapTableFunction::get_value_length(int64_t* length) {
if (_is_current_empty) {
*length = -1;
} else {
*length = sizeof(uint64_t);
}
return Status::OK();
}
} // namespace doris::vectorized

View File

@ -0,0 +1,40 @@
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
#pragma once
#include "exprs/table_function/explode_bitmap.h"
#include "exprs/table_function/table_function.h"
#include "util/bitmap_value.h"
#include "vec/columns/column.h"
namespace doris::vectorized {
class VExplodeBitmapTableFunction : public ExplodeBitmapTableFunction {
public:
VExplodeBitmapTableFunction();
Status process_init(vectorized::Block* block) override;
Status process_row(size_t row_idx) override;
Status process_close() override;
Status get_value_length(int64_t* length) override;
private:
ColumnPtr _value_column;
};
} // namespace doris::vectorized

View File

@ -26,6 +26,7 @@ void register_function_fake(SimpleFunctionFactory& factory) {
factory.register_function<FunctionFake<FunctionExplodeJsonArrayDoubleImpl>>();
factory.register_function<FunctionFake<FunctionExplodeJsonArrayIntImpl>>();
factory.register_function<FunctionFake<FunctionExplodeJsonArrayStringImpl>>();
factory.register_function<FunctionFake<FunctionExplodeBitmapImpl>>();
}
} // namespace doris::vectorized

View File

@ -67,6 +67,14 @@ struct FunctionExplodeJsonArrayDoubleImpl {
return std::make_shared<DataTypeFloat64>();
}
};
struct FunctionExplodeBitmapImpl {
static constexpr auto name = "explode_bitmap";
static DataTypePtr get_return_type_impl(const DataTypes& arguments) {
return std::make_shared<DataTypeInt64>();
}
};
//FunctionFake is use for some function call expr only work at prepare/open phase, do not support execute().
template <typename Impl>
class FunctionFake : public IFunction {