Files
doris/be/src/runtime/thread_context.h
2022-08-01 09:44:04 +08:00

283 lines
10 KiB
C++

// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
#pragma once
#include <service/brpc_conflict.h>
// After brpc_conflict.h
#include <bthread/bthread.h>
#include <string>
#include <thread>
#include "common/logging.h"
#include "gen_cpp/PaloInternalService_types.h" // for TQueryType
#include "runtime/memory/thread_mem_tracker_mgr.h"
#include "runtime/threadlocal.h"
// Add thread mem tracker consumer during query execution.
#define SCOPED_CONSUME_MEM_TRACKER(mem_tracker) \
auto VARNAME_LINENUM(add_mem_consumer) = doris::AddThreadMemTrackerConsumer(mem_tracker)
#define SCOPED_UPDATE_MEM_EXCEED_CALL_BACK(cancel_msg, ...) \
auto VARNAME_LINENUM(update_exceed_cb) = \
doris::UpdateMemExceedCallBack(cancel_msg, ##__VA_ARGS__)
namespace doris {
class TUniqueId;
class ThreadContext;
extern bthread_key_t btls_key;
// Using gcc11 compiles thread_local variable on lower versions of GLIBC will report an error,
// see https://github.com/apache/doris/pull/7911
//
// If we want to avoid this error,
// 1. For non-trivial variables in thread_local, such as std::string, you need to store them as pointers to
// ensure that thread_local is trivial, these non-trivial pointers will uniformly call destructors elsewhere.
// 2. The default destructor of the thread_local variable cannot be overridden.
//
// This is difficult to implement. Because the destructor is not overwritten, it means that the outside cannot
// be notified when the thread terminates, and the non-trivial pointers in thread_local cannot be released in time.
// The func provided by pthread and std::thread doesn't help either.
//
// So, kudu Class-scoped static thread local implementation was introduced. Solve the above problem by
// Thread-scoped thread local + Class-scoped thread local.
//
// This may look very trick, but it's the best way I can find.
//
// refer to:
// https://gcc.gnu.org/onlinedocs/gcc-3.3.1/gcc/Thread-Local.html
// https://stackoverflow.com/questions/12049684/
// https://sourceware.org/glibc/wiki/Destructor%20support%20for%20thread_local%20variables
// https://www.jianshu.com/p/756240e837dd
// https://man7.org/linux/man-pages/man3/pthread_tryjoin_np.3.html
class ThreadContextPtr {
public:
ThreadContextPtr();
// Cannot add destructor `~ThreadContextPtr`, otherwise it will no longer be of type POD, the reason is as above.
// TCMalloc hook is triggered during ThreadContext construction, which may lead to deadlock.
bool _init = false;
DECLARE_STATIC_THREAD_LOCAL(ThreadContext, _ptr);
};
inline thread_local ThreadContextPtr thread_context_ptr;
// To avoid performance problems caused by frequently calling `bthread_getspecific` to obtain bthread TLS
// in tcmalloc hook, cache the key and value of bthread TLS in pthread TLS.
inline thread_local ThreadContext* bthread_context;
inline thread_local bthread_key_t bthread_context_key;
// The thread context saves some info about a working thread.
// 2 required info:
// 1. thread_id: Current thread id, Auto generated.
// 2. type: The type is a enum value indicating which type of task current thread is running.
// For example: QUERY, LOAD, COMPACTION, ...
// 3. task id: A unique id to identify this task. maybe query id, load job id, etc.
//
// There may be other optional info to be added later.
class ThreadContext {
public:
enum TaskType {
UNKNOWN = 0,
QUERY = 1,
LOAD = 2,
COMPACTION = 3,
STORAGE = 4,
BRPC = 5
// to be added ...
};
inline static const std::string TaskTypeStr[] = {"UNKNOWN", "QUERY", "LOAD", "COMPACTION",
"STORAGE"};
public:
ThreadContext() {
_thread_mem_tracker_mgr.reset(new ThreadMemTrackerMgr());
init();
}
~ThreadContext() {
// Restore to the memory state before _init=true to ensure accurate overall memory statistics.
// Thereby ensuring that the memory alloc size is not tracked during the initialization of the
// ThreadContext before `_init = true in ThreadContextPtr()`,
// Equal to the size of the memory release that is not tracked during the destruction of the
// ThreadContext after `_init = false in ~ThreadContextPtr()`,
init();
thread_context_ptr._init = false;
}
void init() {
_type = TaskType::UNKNOWN;
_thread_mem_tracker_mgr->init();
_thread_id = get_thread_id();
}
void attach_task(const TaskType& type, const std::string& task_id,
const TUniqueId& fragment_instance_id,
const std::shared_ptr<MemTrackerLimiter>& mem_tracker) {
DCHECK((_type == TaskType::UNKNOWN || _type == TaskType::BRPC) && _task_id == "")
<< ",new tracker label: " << mem_tracker->label() << ",old tracker label: "
<< _thread_mem_tracker_mgr->limiter_mem_tracker()->label();
DCHECK(type != TaskType::UNKNOWN);
_type = type;
_task_id = task_id;
_fragment_instance_id = fragment_instance_id;
_thread_mem_tracker_mgr->attach_limiter_tracker(TaskTypeStr[_type], task_id,
fragment_instance_id, mem_tracker);
}
void detach_task() {
_type = TaskType::UNKNOWN;
_task_id = "";
_fragment_instance_id = TUniqueId();
_thread_mem_tracker_mgr->detach_limiter_tracker();
}
const TaskType& type() const { return _type; }
const void set_type(const TaskType& type) { _type = type; }
const std::string& task_id() const { return _task_id; }
const std::string& thread_id_str() const { return _thread_id; }
const TUniqueId& fragment_instance_id() const { return _fragment_instance_id; }
std::string get_thread_id() {
std::stringstream ss;
ss << std::this_thread::get_id();
return ss.str();
}
// After _thread_mem_tracker_mgr is initialized, the current thread TCMalloc Hook starts to
// consume/release mem_tracker.
// Note that the use of shared_ptr will cause a crash. The guess is that there is an
// intermediate state during the copy construction of shared_ptr. Shared_ptr is not equal
// to nullptr, but the object it points to is not initialized. At this time, when the memory
// is released somewhere, the TCMalloc hook is triggered to cause the crash.
std::unique_ptr<ThreadMemTrackerMgr> _thread_mem_tracker_mgr;
private:
std::string _thread_id;
TaskType _type;
std::string _task_id;
TUniqueId _fragment_instance_id;
};
static void update_bthread_context() {
if (btls_key != bthread_context_key) {
// pthread switch occurs, updating bthread_context and bthread_context_key cached in pthread tls.
bthread_context = static_cast<ThreadContext*>(bthread_getspecific(btls_key));
bthread_context_key = btls_key;
}
}
static ThreadContext* thread_context() {
if (btls_key != EMPTY_BTLS_KEY && bthread_context != nullptr) {
update_bthread_context();
return bthread_context;
} else {
return thread_context_ptr._ptr;
}
}
class AttachTask {
public:
explicit AttachTask(const std::shared_ptr<MemTrackerLimiter>& mem_tracker,
const ThreadContext::TaskType& type = ThreadContext::TaskType::UNKNOWN,
const std::string& task_id = "",
const TUniqueId& fragment_instance_id = TUniqueId());
explicit AttachTask(RuntimeState* runtime_state);
const ThreadContext::TaskType query_to_task_type(const TQueryType::type& query_type) {
switch (query_type) {
case TQueryType::SELECT:
return ThreadContext::TaskType::QUERY;
case TQueryType::LOAD:
return ThreadContext::TaskType::LOAD;
default:
DCHECK(false);
return ThreadContext::TaskType::UNKNOWN;
}
}
~AttachTask();
};
class AddThreadMemTrackerConsumer {
public:
explicit AddThreadMemTrackerConsumer(MemTracker* mem_tracker);
~AddThreadMemTrackerConsumer();
};
class UpdateMemExceedCallBack {
public:
explicit UpdateMemExceedCallBack(const std::string& cancel_msg, bool cancel_task = true,
ExceedCallBack cb_func = nullptr);
~UpdateMemExceedCallBack();
private:
#ifdef USE_MEM_TRACKER
MemExceedCallBackInfo _old_cb;
#endif
};
class SwitchBthread {
public:
explicit SwitchBthread();
~SwitchBthread();
private:
#ifdef USE_MEM_TRACKER
ThreadContext* _bthread_context;
#endif
};
class StopCheckThreadMemTrackerLimit {
public:
explicit StopCheckThreadMemTrackerLimit() {
thread_context()->_thread_mem_tracker_mgr->set_check_limit(false);
}
~StopCheckThreadMemTrackerLimit() {
thread_context()->_thread_mem_tracker_mgr->set_check_limit(true);
}
};
#define SCOPED_SWITCH_BTHREAD_TLS() auto VARNAME_LINENUM(switch_bthread) = SwitchBthread()
// Attach to task when thread starts
#define SCOPED_ATTACH_TASK(arg1, ...) \
auto VARNAME_LINENUM(attach_task) = AttachTask(arg1, ##__VA_ARGS__)
#define STOP_CHECK_THREAD_MEM_TRACKER_LIMIT() \
auto VARNAME_LINENUM(stop_check_limit) = StopCheckThreadMemTrackerLimit()
#define CONSUME_THREAD_MEM_TRACKER(size) \
doris::thread_context()->_thread_mem_tracker_mgr->consume(size)
#define RELEASE_THREAD_MEM_TRACKER(size) \
doris::thread_context()->_thread_mem_tracker_mgr->consume(-size)
#define THREAD_MEM_TRACKER_TRANSFER_TO(size, tracker) \
doris::thread_context()->_thread_mem_tracker_mgr->transfer_to(size, tracker)
#define THREAD_MEM_TRACKER_TRANSFER_FROM(size, tracker) \
doris::thread_context()->_thread_mem_tracker_mgr->transfer_from(size, tracker)
} // namespace doris