1. MemTableFlushExecutor maintain a ThreadPool to receive FlushTask. 2. FlushToken is used to seperate different tasks from different tablets. Every DeltaWriter of tablet constructs a FlushToken, task in FlushToken are handle serially, task between FlushToken are handle concurrently. 3. I have remove thread limit on data_dir, because of I/O is not the main timer consumer of Flush thread. Much of time is consumed in CPU decoding and compress.
241 lines
9.2 KiB
C++
241 lines
9.2 KiB
C++
// Licensed to the Apache Software Foundation (ASF) under one
|
|
// or more contributor license agreements. See the NOTICE file
|
|
// distributed with this work for additional information
|
|
// regarding copyright ownership. The ASF licenses this file
|
|
// to you under the Apache License, Version 2.0 (the
|
|
// "License"); you may not use this file except in compliance
|
|
// with the License. You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing,
|
|
// software distributed under the License is distributed on an
|
|
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
|
// KIND, either express or implied. See the License for the
|
|
// specific language governing permissions and limitations
|
|
// under the License.
|
|
|
|
#include "runtime/exec_env.h"
|
|
|
|
#include <boost/algorithm/string.hpp>
|
|
|
|
#include "common/config.h"
|
|
#include "common/logging.h"
|
|
#include "runtime/broker_mgr.h"
|
|
#include "runtime/bufferpool/buffer_pool.h"
|
|
#include "runtime/client_cache.h"
|
|
#include "runtime/data_stream_mgr.h"
|
|
#include "runtime/disk_io_mgr.h"
|
|
#include "runtime/external_scan_context_mgr.h"
|
|
#include "runtime/result_buffer_mgr.h"
|
|
#include "runtime/result_queue_mgr.h"
|
|
#include "runtime/mem_tracker.h"
|
|
#include "runtime/thread_resource_mgr.h"
|
|
#include "runtime/fragment_mgr.h"
|
|
#include "runtime/load_channel_mgr.h"
|
|
#include "runtime/tmp_file_mgr.h"
|
|
#include "runtime/bufferpool/reservation_tracker.h"
|
|
#include "util/metrics.h"
|
|
#include "util/network_util.h"
|
|
#include "util/parse_util.h"
|
|
#include "util/mem_info.h"
|
|
#include "util/debug_util.h"
|
|
#include "olap/storage_engine.h"
|
|
#include "olap/page_cache.h"
|
|
#include "util/network_util.h"
|
|
#include "util/bfd_parser.h"
|
|
#include "runtime/etl_job_mgr.h"
|
|
#include "runtime/load_path_mgr.h"
|
|
#include "runtime/routine_load/routine_load_task_executor.h"
|
|
#include "runtime/stream_load/load_stream_mgr.h"
|
|
#include "runtime/stream_load/stream_load_executor.h"
|
|
#include "runtime/small_file_mgr.h"
|
|
#include "util/pretty_printer.h"
|
|
#include "util/doris_metrics.h"
|
|
#include "util/brpc_stub_cache.h"
|
|
#include "util/priority_thread_pool.hpp"
|
|
#include "agent/cgroups_mgr.h"
|
|
#include "gen_cpp/BackendService.h"
|
|
#include "gen_cpp/FrontendService.h"
|
|
#include "gen_cpp/TPaloBrokerService.h"
|
|
#include "gen_cpp/TExtDataSourceService.h"
|
|
#include "gen_cpp/HeartbeatService_types.h"
|
|
#include "runtime/heartbeat_flags.h"
|
|
|
|
namespace doris {
|
|
|
|
Status ExecEnv::init(ExecEnv* env, const std::vector<StorePath>& store_paths) {
|
|
return env->_init(store_paths);
|
|
}
|
|
|
|
Status ExecEnv::_init(const std::vector<StorePath>& store_paths) {
|
|
_store_paths = store_paths;
|
|
_external_scan_context_mgr = new ExternalScanContextMgr(this);
|
|
_metrics = DorisMetrics::metrics();
|
|
_stream_mgr = new DataStreamMgr();
|
|
_result_mgr = new ResultBufferMgr();
|
|
_result_queue_mgr = new ResultQueueMgr();
|
|
_backend_client_cache = new BackendServiceClientCache(config::max_client_cache_size_per_host);
|
|
_frontend_client_cache = new FrontendServiceClientCache(config::max_client_cache_size_per_host);
|
|
_broker_client_cache = new BrokerServiceClientCache(config::max_client_cache_size_per_host);
|
|
_extdatasource_client_cache = new ExtDataSourceServiceClientCache(config::max_client_cache_size_per_host);
|
|
_mem_tracker = nullptr;
|
|
_pool_mem_trackers = new PoolMemTrackerRegistry();
|
|
_thread_mgr = new ThreadResourceMgr();
|
|
_thread_pool = new PriorityThreadPool(
|
|
config::doris_scanner_thread_pool_thread_num,
|
|
config::doris_scanner_thread_pool_queue_size);
|
|
_etl_thread_pool = new PriorityThreadPool(
|
|
config::etl_thread_pool_size,
|
|
config::etl_thread_pool_queue_size);
|
|
_cgroups_mgr = new CgroupsMgr(this, config::doris_cgroups);
|
|
_fragment_mgr = new FragmentMgr(this);
|
|
_master_info = new TMasterInfo();
|
|
_etl_job_mgr = new EtlJobMgr(this);
|
|
_load_path_mgr = new LoadPathMgr(this);
|
|
_disk_io_mgr = new DiskIoMgr();
|
|
_tmp_file_mgr = new TmpFileMgr(this),
|
|
_bfd_parser = BfdParser::create();
|
|
_broker_mgr = new BrokerMgr(this);
|
|
_load_channel_mgr = new LoadChannelMgr();
|
|
_load_stream_mgr = new LoadStreamMgr();
|
|
_brpc_stub_cache = new BrpcStubCache();
|
|
_stream_load_executor = new StreamLoadExecutor(this);
|
|
_routine_load_task_executor = new RoutineLoadTaskExecutor(this);
|
|
_small_file_mgr = new SmallFileMgr(this, config::small_file_dir);
|
|
|
|
_backend_client_cache->init_metrics(DorisMetrics::metrics(), "backend");
|
|
_frontend_client_cache->init_metrics(DorisMetrics::metrics(), "frontend");
|
|
_broker_client_cache->init_metrics(DorisMetrics::metrics(), "broker");
|
|
_extdatasource_client_cache->init_metrics(DorisMetrics::metrics(), "extdatasource");
|
|
_result_mgr->init();
|
|
_cgroups_mgr->init_cgroups();
|
|
_etl_job_mgr->init();
|
|
Status status = _load_path_mgr->init();
|
|
if (!status.ok()) {
|
|
LOG(ERROR) << "load path mgr init failed." << status.get_error_msg();
|
|
exit(-1);
|
|
}
|
|
_broker_mgr->init();
|
|
_small_file_mgr->init();
|
|
_init_mem_tracker();
|
|
|
|
RETURN_IF_ERROR(_load_channel_mgr->init(_mem_tracker->limit()));
|
|
_heartbeat_flags = new HeartbeatFlags();
|
|
return Status::OK();
|
|
}
|
|
|
|
Status ExecEnv::_init_mem_tracker() {
|
|
// Initialize global memory limit.
|
|
int64_t bytes_limit = 0;
|
|
bool is_percent = false;
|
|
std::stringstream ss;
|
|
// --mem_limit="" means no memory limit
|
|
bytes_limit = ParseUtil::parse_mem_spec(config::mem_limit, &is_percent);
|
|
if (bytes_limit < 0) {
|
|
ss << "Failed to parse mem limit from '" + config::mem_limit + "'.";
|
|
return Status::InternalError(ss.str());
|
|
}
|
|
|
|
if (!BitUtil::IsPowerOf2(config::min_buffer_size)) {
|
|
ss << "--min_buffer_size must be a power-of-two: " << config::min_buffer_size;
|
|
return Status::InternalError(ss.str());
|
|
}
|
|
|
|
int64_t buffer_pool_limit = ParseUtil::parse_mem_spec(
|
|
config::buffer_pool_limit, &is_percent);
|
|
if (buffer_pool_limit <= 0) {
|
|
ss << "Invalid --buffer_pool_limit value, must be a percentage or "
|
|
"positive bytes value or percentage: " << config::buffer_pool_limit;
|
|
return Status::InternalError(ss.str());
|
|
}
|
|
buffer_pool_limit = BitUtil::RoundDown(buffer_pool_limit, config::min_buffer_size);
|
|
|
|
int64_t clean_pages_limit = ParseUtil::parse_mem_spec(
|
|
config::buffer_pool_clean_pages_limit, &is_percent);
|
|
if (clean_pages_limit <= 0) {
|
|
ss << "Invalid --buffer_pool_clean_pages_limit value, must be a percentage or "
|
|
"positive bytes value or percentage: " << config::buffer_pool_clean_pages_limit;
|
|
return Status::InternalError(ss.str());
|
|
}
|
|
|
|
_init_buffer_pool(config::min_buffer_size, buffer_pool_limit, clean_pages_limit);
|
|
|
|
// Limit of 0 means no memory limit.
|
|
if (bytes_limit > 0) {
|
|
_mem_tracker = new MemTracker(bytes_limit);
|
|
}
|
|
|
|
if (bytes_limit > MemInfo::physical_mem()) {
|
|
LOG(WARNING) << "Memory limit "
|
|
<< PrettyPrinter::print(bytes_limit, TUnit::BYTES)
|
|
<< " exceeds physical memory of "
|
|
<< PrettyPrinter::print(MemInfo::physical_mem(),
|
|
TUnit::BYTES);
|
|
}
|
|
|
|
LOG(INFO) << "Using global memory limit: " << PrettyPrinter::print(bytes_limit, TUnit::BYTES);
|
|
RETURN_IF_ERROR(_disk_io_mgr->init(_mem_tracker));
|
|
RETURN_IF_ERROR(_tmp_file_mgr->init(DorisMetrics::metrics()));
|
|
|
|
int64_t storage_cache_limit = ParseUtil::parse_mem_spec(
|
|
config::storage_page_cache_limit, &is_percent);
|
|
if (storage_cache_limit > MemInfo::physical_mem()) {
|
|
LOG(WARNING) << "Config storage_page_cache_limit is greater than memory size, config="
|
|
<< config::storage_page_cache_limit
|
|
<< ", memory=" << MemInfo::physical_mem();
|
|
}
|
|
StoragePageCache::create_global_cache(storage_cache_limit);
|
|
|
|
// TODO(zc): The current memory usage configuration is a bit confusing,
|
|
// we need to sort out the use of memory
|
|
return Status::OK();
|
|
}
|
|
|
|
void ExecEnv::_init_buffer_pool(int64_t min_page_size,
|
|
int64_t capacity,
|
|
int64_t clean_pages_limit) {
|
|
DCHECK(_buffer_pool == nullptr);
|
|
_buffer_pool = new BufferPool(min_page_size, capacity, clean_pages_limit);
|
|
_buffer_reservation = new ReservationTracker();
|
|
_buffer_reservation->InitRootTracker(nullptr, capacity);
|
|
}
|
|
|
|
void ExecEnv::_destory() {
|
|
delete _brpc_stub_cache;
|
|
delete _load_stream_mgr;
|
|
delete _load_channel_mgr;
|
|
delete _broker_mgr;
|
|
delete _bfd_parser;
|
|
delete _tmp_file_mgr;
|
|
delete _disk_io_mgr;
|
|
delete _load_path_mgr;
|
|
delete _etl_job_mgr;
|
|
delete _master_info;
|
|
delete _fragment_mgr;
|
|
delete _cgroups_mgr;
|
|
delete _etl_thread_pool;
|
|
delete _thread_pool;
|
|
delete _thread_mgr;
|
|
delete _pool_mem_trackers;
|
|
delete _mem_tracker;
|
|
delete _broker_client_cache;
|
|
delete _extdatasource_client_cache;
|
|
delete _frontend_client_cache;
|
|
delete _backend_client_cache;
|
|
delete _result_mgr;
|
|
delete _result_queue_mgr;
|
|
delete _stream_mgr;
|
|
delete _stream_load_executor;
|
|
delete _routine_load_task_executor;
|
|
delete _external_scan_context_mgr;
|
|
delete _heartbeat_flags;
|
|
_metrics = nullptr;
|
|
}
|
|
|
|
void ExecEnv::destroy(ExecEnv* env) {
|
|
env->_destory();
|
|
}
|
|
|
|
}
|