[enhance](match) Support match query without inverted index (#19936)
This commit is contained in:
141
be/src/vec/exprs/vmatch_predicate.cpp
Normal file
141
be/src/vec/exprs/vmatch_predicate.cpp
Normal file
@ -0,0 +1,141 @@
|
||||
// Licensed to the Apache Software Foundation (ASF) under one
|
||||
// or more contributor license agreements. See the NOTICE file
|
||||
// distributed with this work for additional information
|
||||
// regarding copyright ownership. The ASF licenses this file
|
||||
// to you under the Apache License, Version 2.0 (the
|
||||
// "License"); you may not use this file except in compliance
|
||||
// with the License. You may obtain a copy of the License at
|
||||
//
|
||||
// http://www.apache.org/licenses/LICENSE-2.0
|
||||
//
|
||||
// Unless required by applicable law or agreed to in writing,
|
||||
// software distributed under the License is distributed on an
|
||||
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
||||
// KIND, either express or implied. See the License for the
|
||||
// specific language governing permissions and limitations
|
||||
// under the License.
|
||||
|
||||
#include "vec/exprs/vmatch_predicate.h"
|
||||
|
||||
#include <fmt/format.h>
|
||||
#include <fmt/ranges.h> // IWYU pragma: keep
|
||||
#include <gen_cpp/Exprs_types.h>
|
||||
#include <glog/logging.h>
|
||||
#include <stddef.h>
|
||||
|
||||
#include <algorithm>
|
||||
#include <memory>
|
||||
#include <ostream>
|
||||
#include <string_view>
|
||||
#include <vector>
|
||||
|
||||
#include "common/status.h"
|
||||
#include "vec/core/block.h"
|
||||
#include "vec/core/column_numbers.h"
|
||||
#include "vec/core/column_with_type_and_name.h"
|
||||
#include "vec/core/columns_with_type_and_name.h"
|
||||
#include "vec/exprs/vexpr_context.h"
|
||||
#include "vec/functions/simple_function_factory.h"
|
||||
|
||||
// Forward declarations only: in this file these types appear solely as a pointer
// (RuntimeState*) or a reference (const RowDescriptor&) parameter of prepare/open/close.
namespace doris {
class RowDescriptor;
class RuntimeState;
} // namespace doris
|
||||
|
||||
namespace doris::vectorized {
|
||||
|
||||
// Builds a match predicate from its thrift expression node.
//
// Creates the inverted-index context that is later handed to the match function
// (see open()) and fills it with the parser settings carried by
// `node.match_predicate`: the parser type (converted from its string form) and
// the parser mode (copied as-is).
VMatchPredicate::VMatchPredicate(const TExprNode& node)
        : VExpr(node), _inverted_index_ctx(std::make_shared<InvertedIndexCtx>()) {
    const auto& match_node = node.match_predicate;
    _inverted_index_ctx->parser_type =
            get_inverted_index_parser_type_from_string(match_node.parser_type);
    _inverted_index_ctx->parser_mode = match_node.parser_mode;
}
|
||||
|
||||
// Prepares the predicate for execution.
//
// After the base-class prepare succeeds, the concrete match function is looked up
// in SimpleFunctionFactory by `_fn.name.function_name`, using the data types and
// names of the child expressions as the argument template and `_data_type` as the
// return type.
//
// Returns:
//   - whatever RETURN_IF_ERROR_OR_PREPARED propagates from VExpr::prepare
//     (presumably an error, or an early OK when already prepared -- see the macro),
//   - Status::NotSupported when the factory has no matching function,
//   - Status::OK otherwise, with `_function`, `_expr_name` and `_function_name` set
//     and a function context registered on `context`.
Status VMatchPredicate::prepare(RuntimeState* state, const RowDescriptor& desc,
                                VExprContext* context) {
    RETURN_IF_ERROR_OR_PREPARED(VExpr::prepare(state, desc, context));

    ColumnsWithTypeAndName argument_template;
    argument_template.reserve(_children.size());
    // Views into the children's own name strings; only used to format _expr_name below.
    std::vector<std::string_view> child_expr_name;
    child_expr_name.reserve(_children.size());
    // Iterate by const reference: copying each child handle per iteration is unnecessary.
    for (const auto& child : _children) {
        argument_template.emplace_back(nullptr, child->data_type(), child->expr_name());
        child_expr_name.emplace_back(child->expr_name());
    }

    _function = SimpleFunctionFactory::instance().get_function(_fn.name.function_name,
                                                               argument_template, _data_type);
    if (_function == nullptr) {
        // Build " <type> <type> ..." for the error message (each name is preceded by a space).
        std::string type_str;
        for (const auto& arg : argument_template) {
            type_str += " ";
            type_str += arg.type->get_name();
        }
        return Status::NotSupported(
                "Function {} is not implemented, input param type is {}, "
                "and return type is {}.",
                _fn.name.function_name, type_str, _data_type->get_name());
    }

    VExpr::register_function_context(state, context);
    _expr_name = fmt::format("{}({})", _fn.name.function_name, child_expr_name);
    _function_name = _fn.name.function_name;

    return Status::OK();
}
|
||||
|
||||
// Opens the predicate for the given function-state scope.
//
// Runs the base-class open and initializes the function context for `_function`;
// an error from either step is returned immediately. For the THREAD_LOCAL scope
// only, the inverted-index context built in the constructor is installed as the
// function state of this expression's function context.
Status VMatchPredicate::open(RuntimeState* state, VExprContext* context,
                             FunctionContext::FunctionStateScope scope) {
    RETURN_IF_ERROR(VExpr::open(state, context, scope));
    RETURN_IF_ERROR(VExpr::init_function_context(context, scope, _function));

    // Other scopes do not receive the inverted-index context.
    if (scope != FunctionContext::THREAD_LOCAL) {
        return Status::OK();
    }

    auto* fn_ctx = context->fn_context(_fn_context_index);
    fn_ctx->set_function_state(scope, _inverted_index_ctx);
    return Status::OK();
}
|
||||
|
||||
// Closes the predicate for the given function-state scope.
//
// The function context of `_function` is closed first, then the base-class close
// is invoked; the order mirrors open() in reverse.
void VMatchPredicate::close(RuntimeState* state, VExprContext* context,
                            FunctionContext::FunctionStateScope scope) {
    // Release the function's per-scope state before the base class closes.
    VExpr::close_function_context(context, scope, _function);

    VExpr::close(state, context, scope);
}
|
||||
|
||||
// Evaluates the match function over `block`.
//
// Every child expression is executed first; the column ids they report become the
// function's argument list. A result column (type `_data_type`, name `_expr_name`)
// is then inserted into the block, the function is run over all rows of the block,
// and the index of the result column is written to `*result_column_id`.
//
// Returns the first error produced by a child expression or by the function,
// otherwise Status::OK.
Status VMatchPredicate::execute(VExprContext* context, Block* block, int* result_column_id) {
    // TODO: not execute const expr again, but use the const column in function context
    const size_t num_children = _children.size();
    doris::vectorized::ColumnNumbers arguments(num_children);
    // size_t index: avoids comparing a signed int against the unsigned container size.
    for (size_t i = 0; i < num_children; ++i) {
        int column_id = -1;
        RETURN_IF_ERROR(_children[i]->execute(context, block, &column_id));
        arguments[i] = column_id;
    }

    // Column count before the insertion below; used as the index of the result column.
    const size_t num_columns_without_result = block->columns();
    // prepare a column to save result
    block->insert({nullptr, _data_type, _expr_name});
    // call function
    RETURN_IF_ERROR(_function->execute(context->fn_context(_fn_context_index), *block, arguments,
                                       num_columns_without_result, block->rows(), false));

    // The out-parameter is an int; make the size_t -> int conversion explicit.
    *result_column_id = static_cast<int>(num_columns_without_result);
    return Status::OK();
}
|
||||
|
||||
const std::string& VMatchPredicate::expr_name() const {
|
||||
return _expr_name;
|
||||
}
|
||||
|
||||
const std::string& VMatchPredicate::function_name() const {
|
||||
return _function_name;
|
||||
}
|
||||
|
||||
// Renders this predicate for diagnostics as
//   MatchPredicate(<child 0>,[<child 1> <child 2> ...])
// where each child is printed with its own debug_string() and the bracketed
// children are separated by single spaces.
//
// An empty child list is tolerated and yields "MatchPredicate(,[])" rather than
// indexing past the end of the child vector.
std::string VMatchPredicate::debug_string() const {
    const auto& kids = children();

    std::stringstream out;
    out << "MatchPredicate(";
    if (!kids.empty()) {
        out << kids[0]->debug_string();
    }
    out << ",[";

    // size_t index: the child count is unsigned, so no narrowing to int is needed.
    for (size_t i = 1; i < kids.size(); ++i) {
        out << (i == 1 ? "" : " ") << kids[i]->debug_string();
    }

    out << "])";
    return out.str();
}
|
||||
|
||||
} // namespace doris::vectorized
|
||||
Reference in New Issue
Block a user