Pure DocValue optimization for doris-on-es Future todo: Today, for every tuple scan we check if pure_docvalue is enabled, this is not reasonable, should check pure_docvalue enabled for one whole scan outside, I will add this todo in future
128 lines
3.9 KiB
C++
128 lines
3.9 KiB
C++
// Licensed to the Apache Software Foundation (ASF) under one
|
|
// or more contributor license agreements. See the NOTICE file
|
|
// distributed with this work for additional information
|
|
// regarding copyright ownership. The ASF licenses this file
|
|
// to you under the Apache License, Version 2.0 (the
|
|
// "License"); you may not use this file except in compliance
|
|
// with the License. You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing,
|
|
// software distributed under the License is distributed on an
|
|
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
|
// KIND, either express or implied. See the License for the
|
|
// specific language governing permissions and limitations
|
|
// under the License.
|
|
|
|
#include "exec/es_http_scanner.h"
|
|
|
|
#include <sstream>
|
|
#include <iostream>
|
|
|
|
#include "runtime/descriptors.h"
|
|
#include "runtime/exec_env.h"
|
|
#include "runtime/mem_tracker.h"
|
|
#include "runtime/raw_value.h"
|
|
#include "runtime/runtime_state.h"
|
|
#include "runtime/tuple.h"
|
|
#include "exprs/expr.h"
|
|
|
|
namespace doris {
|
|
|
|
EsHttpScanner::EsHttpScanner(
|
|
RuntimeState* state,
|
|
RuntimeProfile* profile,
|
|
TupleId tuple_id,
|
|
const std::map<std::string, std::string>& properties,
|
|
const std::vector<ExprContext*>& conjunct_ctxs,
|
|
EsScanCounter* counter) :
|
|
_state(state),
|
|
_profile(profile),
|
|
_tuple_id(tuple_id),
|
|
_properties(properties),
|
|
_conjunct_ctxs(conjunct_ctxs),
|
|
_next_range(0),
|
|
_line_eof(false),
|
|
_batch_eof(false),
|
|
#if BE_TEST
|
|
_mem_tracker(new MemTracker()),
|
|
_mem_pool(_mem_tracker.get()),
|
|
#else
|
|
_mem_tracker(new MemTracker(-1, "EsHttp Scanner", state->instance_mem_tracker())),
|
|
_mem_pool(_state->instance_mem_tracker()),
|
|
#endif
|
|
_tuple_desc(nullptr),
|
|
_counter(counter),
|
|
_es_reader(nullptr),
|
|
_es_scroll_parser(nullptr),
|
|
_rows_read_counter(nullptr),
|
|
_read_timer(nullptr),
|
|
_materialize_timer(nullptr) {
|
|
}
|
|
|
|
EsHttpScanner::~EsHttpScanner() {
|
|
close();
|
|
}
|
|
|
|
Status EsHttpScanner::open() {
|
|
_tuple_desc = _state->desc_tbl().get_tuple_descriptor(_tuple_id);
|
|
if (_tuple_desc == nullptr) {
|
|
std::stringstream ss;
|
|
ss << "Unknown tuple descriptor, tuple_id=" << _tuple_id;
|
|
return Status::InternalError(ss.str());
|
|
}
|
|
|
|
const std::string& host = _properties.at(ESScanReader::KEY_HOST_PORT);
|
|
_es_reader.reset(new ESScanReader(host, _properties));
|
|
if (_es_reader == nullptr) {
|
|
return Status::InternalError("Es reader construct failed.");
|
|
}
|
|
|
|
RETURN_IF_ERROR(_es_reader->open());
|
|
|
|
_rows_read_counter = ADD_COUNTER(_profile, "RowsRead", TUnit::UNIT);
|
|
_read_timer = ADD_TIMER(_profile, "TotalRawReadTime(*)");
|
|
_materialize_timer = ADD_TIMER(_profile, "MaterializeTupleTime(*)");
|
|
|
|
return Status::OK();
|
|
}
|
|
|
|
Status EsHttpScanner::get_next(Tuple* tuple, MemPool* tuple_pool, bool* eof, const std::map<std::string, std::string>& docvalue_context) {
|
|
SCOPED_TIMER(_read_timer);
|
|
if (_line_eof && _batch_eof) {
|
|
*eof = true;
|
|
return Status::OK();
|
|
}
|
|
|
|
while (!_batch_eof) {
|
|
if (_line_eof || _es_scroll_parser == nullptr) {
|
|
RETURN_IF_ERROR(_es_reader->get_next(&_batch_eof, _es_scroll_parser));
|
|
if (_batch_eof) {
|
|
*eof = true;
|
|
return Status::OK();
|
|
}
|
|
}
|
|
|
|
COUNTER_UPDATE(_rows_read_counter, 1);
|
|
SCOPED_TIMER(_materialize_timer);
|
|
RETURN_IF_ERROR(_es_scroll_parser->fill_tuple(
|
|
_tuple_desc, tuple, tuple_pool, &_line_eof, docvalue_context));
|
|
if (!_line_eof) {
|
|
break;
|
|
}
|
|
}
|
|
|
|
return Status::OK();
|
|
}
|
|
|
|
void EsHttpScanner::close() {
|
|
if (_es_reader != nullptr) {
|
|
_es_reader->close();
|
|
}
|
|
|
|
Expr::close(_conjunct_ctxs, _state);
|
|
}
|
|
|
|
}
|