Files
oceanbase/src/storage/ob_tenant_tablet_stat_mgr.cpp
2024-02-08 03:42:03 +00:00

976 lines
29 KiB
C++

/**
* Copyright (c) 2023 OceanBase
* OceanBase CE is licensed under Mulan PubL v2.
* You can use this software according to the terms and conditions of the Mulan PubL v2.
* You may obtain a copy of Mulan PubL v2 at:
* http://license.coscl.org.cn/MulanPubL-2.0
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
* See the Mulan PubL v2 for more details.
*/
#define USING_LOG_PREFIX STORAGE
#include "lib/oblog/ob_log_module.h"
#include "share/ob_force_print_log.h"
#include "share/ob_thread_mgr.h"
#include "storage/ob_tenant_tablet_stat_mgr.h"
#include "observer/ob_server_struct.h"
#include "observer/ob_server.h"
#include <sys/sysinfo.h>
using namespace oceanbase;
using namespace oceanbase::common;
using namespace oceanbase::storage;
bool ObTransNodeDMLStat::empty() const
{
return 0 >= insert_row_count_ &&
0 >= update_row_count_ &&
0 >= delete_row_count_;
}
void ObTransNodeDMLStat::atomic_inc(const ObTransNodeDMLStat &other)
{
if (other.empty()) {
// do nothing
} else {
(void) ATOMIC_AAFx(&insert_row_count_, other.insert_row_count_, 0/*placeholder*/);
(void) ATOMIC_AAFx(&update_row_count_, other.update_row_count_, 0/*placeholder*/);
(void) ATOMIC_AAFx(&delete_row_count_, other.delete_row_count_, 0/*placeholder*/);
}
}
/************************************* ObTabletStatKey *************************************/
ObTabletStatKey::ObTabletStatKey(
const int64_t ls_id,
const uint64_t tablet_id)
: ls_id_(ls_id),
tablet_id_(tablet_id)
{
}
ObTabletStatKey::ObTabletStatKey(
const share::ObLSID ls_id,
const ObTabletID tablet_id)
: ls_id_(ls_id),
tablet_id_(tablet_id)
{
}
ObTabletStatKey::~ObTabletStatKey()
{
}
void ObTabletStatKey::reset()
{
ls_id_.reset();
tablet_id_.reset();
}
uint64_t ObTabletStatKey::hash() const
{
uint64_t hash_val = 0;
hash_val += ls_id_.hash();
hash_val += tablet_id_.hash();
return hash_val;
}
int ObTabletStatKey::hash(uint64_t &hash_val) const
{
hash_val = hash();
return OB_SUCCESS;
}
bool ObTabletStatKey::is_valid() const
{
return ls_id_.is_valid() && tablet_id_.is_valid();
}
bool ObTabletStatKey::operator==(const ObTabletStatKey &other) const
{
bool bret = true;
if (this == &other) {
} else if (ls_id_ != other.ls_id_ || tablet_id_ != other.tablet_id_) {
bret = false;
}
return bret;
}
bool ObTabletStatKey::operator!=(const ObTabletStatKey &other) const
{
return !(*this == other);
}
/************************************* ObTabletStat *************************************/
bool ObTabletStat::is_valid() const
{
return ls_id_ > 0 && tablet_id_ > 0;
}
bool ObTabletStat::check_need_report() const
{
bool bret = false;
ObTabletID tablet_id(tablet_id_);
if (tablet_id.is_ls_inner_tablet()) {
// do nothing
} else if (0 < merge_cnt_) { // report by compaction
bret = get_total_merge_row_count() >= MERGE_REPORT_MIN_ROW_CNT;
} else if (0 < query_cnt_) { // only report the slow query
const int64_t boost_factor = tablet_id.is_inner_tablet() ? 2 : 1;
if (scan_physical_row_cnt_ > 0 &&
scan_physical_row_cnt_ >= scan_logical_row_cnt_ * QUERY_REPORT_INEFFICIENT_THRESHOLD * boost_factor) {
bret = true;
}
if (!bret && scan_micro_block_cnt_ > 0 &&
scan_micro_block_cnt_ >= pushdown_micro_block_cnt_ * QUERY_REPORT_INEFFICIENT_THRESHOLD * boost_factor) {
bret = true;
}
if (!bret && exist_row_total_table_cnt_ > 0 &&
exist_row_total_table_cnt_ >= exist_row_read_table_cnt_ * QUERY_REPORT_INEFFICIENT_THRESHOLD * boost_factor) {
bret = true;
}
}
return bret;
}
ObTabletStat& ObTabletStat::operator=(const ObTabletStat &other)
{
if (this != &other) {
MEMCPY(this, &other, sizeof(ObTabletStat));
}
return *this;
}
ObTabletStat& ObTabletStat::operator+=(const ObTabletStat &other)
{
if (other.is_valid()) {
ls_id_ = other.ls_id_;
tablet_id_ = other.tablet_id_;
query_cnt_ += other.query_cnt_;
merge_cnt_ += other.merge_cnt_;
scan_logical_row_cnt_ += other.scan_logical_row_cnt_;
scan_physical_row_cnt_ += other.scan_physical_row_cnt_;
scan_micro_block_cnt_ += other.scan_micro_block_cnt_;
pushdown_micro_block_cnt_ += other.pushdown_micro_block_cnt_;
exist_row_total_table_cnt_ += other.exist_row_total_table_cnt_;
exist_row_read_table_cnt_ += other.exist_row_read_table_cnt_;
insert_row_cnt_ += other.insert_row_cnt_;
update_row_cnt_ += other.update_row_cnt_;
delete_row_cnt_ += other.delete_row_cnt_;
}
return *this;
}
ObTabletStat& ObTabletStat::archive(int64_t factor)
{
if (factor > 0) {
query_cnt_ /= factor;
merge_cnt_ /= factor;
scan_logical_row_cnt_ /= factor;
scan_physical_row_cnt_ /= factor;
scan_micro_block_cnt_ /= factor;
pushdown_micro_block_cnt_ /= factor;
exist_row_total_table_cnt_ /= factor;
exist_row_read_table_cnt_ /= factor;
insert_row_cnt_ /= factor;
update_row_cnt_ /= factor;
delete_row_cnt_ /= factor;
}
return *this;
}
/************************************* ObTabletStatAnalyzer *************************************/
ObTabletStatAnalyzer::ObTabletStatAnalyzer()
: tablet_stat_(),
boost_factor_(1),
is_small_tenant_(false)
{
}
bool ObTabletStatAnalyzer::is_hot_tablet() const
{
return tablet_stat_.query_cnt_ + tablet_stat_.merge_cnt_ >= ACCESS_FREQUENCY * boost_factor_;
}
bool ObTabletStatAnalyzer::is_insert_mostly() const
{
bool bret = false;
ObTabletID tablet_id(tablet_stat_.tablet_id_);
uint64_t total_row_cnt = tablet_stat_.get_total_merge_row_count();
if (tablet_id.is_inner_tablet() || tablet_id.is_ls_inner_tablet()) {
// do nothing
} else if (0 == tablet_stat_.insert_row_cnt_) {
// no insert occurs
} else if (total_row_cnt < MERGE_BASIC_ROW_CNT * boost_factor_) {
// do nothing
} else {
bret = total_row_cnt * LOAD_THRESHOLD <= tablet_stat_.insert_row_cnt_ * BASE_FACTOR;
}
return bret;
}
bool ObTabletStatAnalyzer::is_update_or_delete_mostly() const
{
bool bret = false;
uint64_t total_row_cnt = tablet_stat_.get_total_merge_row_count();
if (0 == tablet_stat_.delete_row_cnt_ + tablet_stat_.update_row_cnt_) {
// no update && delete occurs
} else if (total_row_cnt < MERGE_BASIC_ROW_CNT * boost_factor_) {
// do nothing
} else {
bret = total_row_cnt * TOMBSTONE_THRESHOLD * boost_factor_ <= (tablet_stat_.update_row_cnt_ + tablet_stat_.delete_row_cnt_) * BASE_FACTOR;
}
return bret;
}
bool ObTabletStatAnalyzer::has_slow_query() const
{
bool bret = false;
// all tablet query stats are ineffecient, only check the basic threshold
if (tablet_stat_.scan_physical_row_cnt_ >= QUERY_BASIC_ROW_CNT * boost_factor_ ||
tablet_stat_.scan_micro_block_cnt_ >= QUERY_BASIC_MICRO_BLOCK_CNT * boost_factor_ ||
tablet_stat_.exist_row_total_table_cnt_ >= QUERY_BASIC_ITER_TABLE_CNT * boost_factor_) {
bret = true;
}
return bret;
}
/************************************* ObTenantSysStat *************************************/
ObTenantSysStat::ObTenantSysStat()
: cpu_usage_percentage_(0),
min_cpu_cnt_(0),
max_cpu_cnt_(0),
memory_hold_(0),
memory_limit_(0)
{
}
void ObTenantSysStat::reset()
{
cpu_usage_percentage_ = 0;
min_cpu_cnt_ = 0;
max_cpu_cnt_ = 0;
memory_hold_ = 0;
memory_limit_ = 0;
}
bool ObTenantSysStat::is_small_tenant() const
{
bool bret = false;
// 8c16g
const int64_t cpu_threshold = 8;
// When the tenant memory exceeds 10GB, the meta tenant occupies at least 10% of the memory.
const int64_t mem_threshold = (16L << 30) * 9 / 10;
bret = max_cpu_cnt_ < cpu_threshold || memory_limit_ < mem_threshold;
return bret;
}
bool ObTenantSysStat::is_full_cpu_usage() const
{
bool bret = false;
if (is_small_tenant()) {
bret = 75 <= cpu_usage_percentage_;
} else {
bret = 85 <= cpu_usage_percentage_;
}
return bret;
}
/************************************* ObTabletStream *************************************/
ObTabletStream::ObTabletStream()
: key_(),
curr_buckets_(CURR_BUCKET_STEP),
latest_buckets_(LATEST_BUCKET_STEP),
past_buckets_(PAST_BUCKET_STEP)
{
}
ObTabletStream::~ObTabletStream()
{
}
void ObTabletStream::reset()
{
key_.reset();
curr_buckets_.reset();
latest_buckets_.reset();
past_buckets_.reset();
}
void ObTabletStream::add_stat(const ObTabletStat &stat)
{
if (!key_.is_valid()) {
key_.ls_id_ = stat.ls_id_;
key_.tablet_id_ = stat.tablet_id_;
}
if (key_.ls_id_.id() == stat.ls_id_ && key_.tablet_id_.id() == stat.tablet_id_) {
curr_buckets_.add(stat);
}
}
void ObTabletStream::refresh()
{
ObTabletStat tablet_stat;
bool has_retired_stat = false;
curr_buckets_.refresh(tablet_stat, has_retired_stat);
latest_buckets_.refresh(tablet_stat, has_retired_stat);
past_buckets_.refresh(tablet_stat, has_retired_stat);
}
int ObTabletStream::get_all_tablet_stat(common::ObIArray<ObTabletStat> &tablet_stats) const
{
int ret = OB_SUCCESS;
if (OB_FAIL(get_bucket_tablet_stat(curr_buckets_, tablet_stats))) {
LOG_WARN("failed to get bucket tablet stat in past bucket", K(ret));
} else if (OB_FAIL(get_bucket_tablet_stat(latest_buckets_, tablet_stats))) {
LOG_WARN("failed to get bucket tablet stat in latest bucket", K(ret));
} else if (OB_FAIL(get_bucket_tablet_stat(past_buckets_, tablet_stats))) {
LOG_WARN("failed to get bucket tablet stat in curr bucket", K(ret));
}
return ret;
}
/************************************* ObTabletStreamPool *************************************/
ObTabletStreamPool::ObTabletStreamPool()
: dynamic_allocator_(MTL_ID()),
free_list_allocator_(ObMemAttr(MTL_ID(), "FreeTbltStream")),
free_list_(),
lru_list_(),
max_free_list_num_(0),
max_dynamic_node_num_(0),
allocated_dynamic_num_(0),
is_inited_(false)
{
}
ObTabletStreamPool::~ObTabletStreamPool()
{
destroy();
}
void ObTabletStreamPool::destroy()
{
is_inited_ = false;
ObTabletStreamNode *node = nullptr;
DLIST_REMOVE_ALL_NORET(node, lru_list_) {
lru_list_.remove(node);
if (DYNAMIC_ALLOC == node->flag_) {
node->~ObTabletStreamNode();
// ObFIFOAllocator::reset does not release memory by default.
dynamic_allocator_.free(node);
} else {
node->~ObTabletStreamNode();
}
node = nullptr;
}
lru_list_.reset();
while (OB_SUCCESS == free_list_.pop(node)) {
if (OB_NOT_NULL(node)) {
node->~ObTabletStreamNode();
node = nullptr;
}
}
dynamic_allocator_.reset();
free_list_.destroy();
free_list_allocator_.reset();
}
int ObTabletStreamPool::init(
const int64_t max_free_list_num,
const int64_t max_dynamic_node_num)
{
int ret = OB_SUCCESS;
const char *LABEL = "IncTbltStream";
ObTabletStreamNode *buf = nullptr;
if (IS_INIT) {
ret = OB_INIT_TWICE;
LOG_WARN("ObTabletStreamPool has been inited", K(ret));
} else if (max_free_list_num <= 0 || max_dynamic_node_num < 0) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("get invalid argument", K(ret), K(max_free_list_num), K(max_dynamic_node_num));
} else if (OB_FAIL(dynamic_allocator_.init(ObMallocAllocator::get_instance(), OB_MALLOC_NORMAL_BLOCK_SIZE,
ObMemAttr(MTL_ID(), LABEL)))) {
LOG_WARN("failed to init fifo allocator", K(ret));
} else if (OB_FAIL(free_list_.init(max_free_list_num, &free_list_allocator_))) {
LOG_WARN("failed to init free list", K(ret), K(max_free_list_num));
} else if (OB_ISNULL(buf = static_cast<ObTabletStreamNode*>(free_list_allocator_.alloc(sizeof(ObTabletStreamNode) * max_free_list_num)))) {
ret = OB_ALLOCATE_MEMORY_FAILED;
LOG_WARN("failed to allocate memory for stream node in free list", K(ret), K(max_free_list_num));
} else {
ObTabletStreamNode *node = nullptr;
for (int64_t i = 0; OB_SUCC(ret) && i < max_free_list_num; ++i) {
node = new (buf + i) ObTabletStreamNode(FIXED_ALLOC);
if (OB_FAIL(free_list_.push(node))) {
LOG_WARN("failed to push node to free list", K(ret));
}
}
if (OB_FAIL(ret)) {
destroy();
} else {
max_free_list_num_ = max_free_list_num;
max_dynamic_node_num_ = max_dynamic_node_num;
is_inited_ = true;
}
}
return ret;
}
int ObTabletStreamPool::alloc(ObTabletStreamNode *&free_node, bool &is_retired)
{
int ret = OB_SUCCESS;
is_retired = false;
void *buf = nullptr;
// 1. try to alloc node from free_list
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("ObTabletStreamPool not inited", K(ret));
} else if (OB_NOT_NULL(free_node)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("get invalid argument", K(ret), K(free_node));
} else if (OB_FAIL(free_list_.pop(free_node))) {
if (OB_ENTRY_NOT_EXIST != ret) {
LOG_WARN("failed to pop free node from free list", K(ret));
}
}
// 2. no free node in free_list, try to alloc node dynamically
if (OB_ENTRY_NOT_EXIST == ret) {
ret = OB_SUCCESS;
if (allocated_dynamic_num_ >= max_dynamic_node_num_) {
ret = OB_SIZE_OVERFLOW;
} else if (OB_ISNULL(buf = dynamic_allocator_.alloc(sizeof(ObTabletStreamNode)))) {
ret = OB_ALLOCATE_MEMORY_FAILED;
LOG_WARN("failed to allocate memory for free node", K(ret));
} else {
free_node = new (buf) ObTabletStreamNode(DYNAMIC_ALLOC);
++allocated_dynamic_num_;
}
}
// 3. dynamic node has reached the upper limit, try to retire the oldest node in lru_list
if (OB_SIZE_OVERFLOW == ret) {
ret = OB_SUCCESS;
if (lru_list_.is_empty()) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("lru list is unexpected null", K(ret));
} else {
free_node = lru_list_.get_last();
is_retired = true;
}
}
return ret;
}
void ObTabletStreamPool::free(ObTabletStreamNode *node)
{
if (OB_NOT_NULL(node)) {
int tmp_ret = OB_SUCCESS;
if (IS_NOT_INIT) {
tmp_ret = OB_NOT_INIT;
LOG_ERROR_RET(tmp_ret, "[MEMORY LEAK] ObTabletStreamPool is not inited, cannot free this node!!!",
K(tmp_ret), KPC(node));
} else if (DYNAMIC_ALLOC == node->flag_) {
node->~ObTabletStreamNode();
dynamic_allocator_.free(node);
--allocated_dynamic_num_;
} else {
node->~ObTabletStreamNode();
OB_ASSERT(OB_SUCCESS == free_list_.push(node));
}
}
}
/************************************* ObTenantSysLoadShedder *************************************/
ObTenantSysLoadShedder::ObTenantSysLoadShedder()
{
reset();
}
void ObTenantSysLoadShedder::reset()
{
MEMSET(this, 0, sizeof(ObTenantSysLoadShedder));
load_shedding_factor_ = 1;
}
void ObTenantSysLoadShedder::refresh_sys_load()
{
if (load_shedding_factor_ > 1 &&
ObTimeUtility::fast_current_time() < effect_time_ + SHEDDER_EXPIRE_TIME) {
// do nothing
} else if (REACH_TENANT_TIME_INTERVAL(CPU_TIME_SAMPLING_INTERVAL)) {
load_shedding_factor_ = 1;
int tmp_ret = OB_SUCCESS;
double max_cpu_cnt = 0;
double min_cpu_cnt = 0;
if (OB_TMP_FAIL(GCTX.omt_->get_tenant_cpu(MTL_ID(), min_cpu_cnt, max_cpu_cnt))) {
LOG_WARN_RET(tmp_ret, "failed to get tennant cpu cnt", "tenant_id", MTL_ID());
} else {
min_cpu_cnt_ = min_cpu_cnt;
max_cpu_cnt_ = max_cpu_cnt;
}
if (min_cpu_cnt_ > 0 && max_cpu_cnt_ > 0) {
(void) refresh_cpu_utility();
}
}
}
int ObTenantSysLoadShedder::refresh_cpu_utility()
{
int ret = OB_SUCCESS;
int64_t curr_cpu_time = last_cpu_time_;
int64_t inc_cpu_time = 0;
int64_t physical_cpu_utility = 0;
if (OB_FAIL(GCTX.omt_->get_tenant_cpu_time(MTL_ID(), curr_cpu_time))) {
LOG_WARN("failed to get tennant cpu cnt", K(ret));
} else {
const int64_t curr_sample_time = ObTimeUtility::fast_current_time();
if (0 == last_sample_time_ || 0 == last_cpu_time_) {
// first time sample, no need to calculate cpu utility
} else {
inc_cpu_time = curr_cpu_time - last_cpu_time_;
physical_cpu_utility = inc_cpu_time * 100 / (curr_sample_time - last_sample_time_);
}
if (physical_cpu_utility > max_cpu_cnt_ * 100) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("cpu utility unexpected bigger than cpu cnt", K(ret), K(max_cpu_cnt_),
K(physical_cpu_utility), K(inc_cpu_time), K(curr_sample_time), K(last_sample_time_));
} else if (physical_cpu_utility >= max_cpu_cnt_ * 100 * CPU_TIME_THRESHOLD) {
ATOMIC_STORE(&load_shedding_factor_, DEFAULT_LOAD_SHEDDING_FACTOR);
effect_time_ = ObTimeUtility::fast_current_time();
FLOG_INFO("[ADAPTIVE_SCHED] refresh cpu utility", K(ret), K(load_shedding_factor_), K(max_cpu_cnt_),
K(physical_cpu_utility), K(inc_cpu_time), K(curr_sample_time), K(last_sample_time_), K(curr_cpu_time), K(last_cpu_time_));
}
last_sample_time_ = curr_sample_time;
last_cpu_time_ = curr_cpu_time;
}
return ret;
}
/************************************* ObTenantTabletStatMgr *************************************/
ObTenantTabletStatMgr::ObTenantTabletStatMgr()
: report_stat_task_(*this),
stream_pool_(),
stream_map_(),
bucket_lock_(),
report_queue_(),
load_shedder_(),
report_cursor_(0),
pending_cursor_(0),
report_tg_id_(0),
is_inited_(false)
{
}
ObTenantTabletStatMgr::~ObTenantTabletStatMgr()
{
destroy();
}
int ObTenantTabletStatMgr::init(const int64_t tenant_id)
{
int ret = OB_SUCCESS;
const bool repeat = true;
int64_t bucket_num = DEFAULT_BUCKET_NUM;
if (IS_INIT) {
ret = OB_INIT_TWICE;
LOG_WARN("ObTenantTabletStatMgr init twice", K(ret));
} else if (OB_FAIL(stream_pool_.init(DEFAULT_MAX_FREE_STREAM_CNT, DEFAULT_UP_LIMIT_STREAM_CNT))) {
LOG_WARN("failed to init tablet stream pool", K(ret));
} else if (OB_FAIL(stream_map_.create(DEFAULT_BUCKET_NUM, ObMemAttr(tenant_id, "TabletStats")))) {
LOG_WARN("failed to create TabletStats", K(ret));
} else if (FALSE_IT(bucket_num = stream_map_.bucket_count())) {
} else if (OB_FAIL(bucket_lock_.init(bucket_num, ObLatchIds::DEFAULT_BUCKET_LOCK,
ObMemAttr(tenant_id, "TabStatMgrLock")))) {
LOG_WARN("failed to init bucket lock", K(ret));
} else if (OB_FAIL(TG_CREATE_TENANT(lib::TGDefIDs::TabletStatRpt, report_tg_id_))) {
LOG_WARN("failed to create TabletStatRpt thread", K(ret));
} else if (OB_FAIL(TG_START(report_tg_id_))) {
LOG_WARN("failed to start stat TabletStatRpt thread", K(ret));
} else if (OB_FAIL(TG_SCHEDULE(report_tg_id_, report_stat_task_, TABLET_STAT_PROCESS_INTERVAL, repeat))) {
LOG_WARN("failed to schedule tablet stat update task", K(ret));
} else {
load_shedder_.refresh_sys_load();
is_inited_ = true;
}
if (!is_inited_) {
reset();
}
return ret;
}
int ObTenantTabletStatMgr::mtl_init(ObTenantTabletStatMgr* &tablet_stat_mgr)
{
int ret = OB_SUCCESS;
if (OB_FAIL(tablet_stat_mgr->init(MTL_ID()))) {
LOG_WARN("failed to init tablet stat mgr", K(ret), K(MTL_ID()));
} else {
LOG_INFO("success to init ObTenantTabletStatMgr", K(MTL_ID()));
}
return ret;
}
void ObTenantTabletStatMgr::wait()
{
TG_WAIT(report_tg_id_);
}
void ObTenantTabletStatMgr::stop()
{
TG_STOP(report_tg_id_);
}
void ObTenantTabletStatMgr::destroy()
{
if (IS_INIT) {
reset();
}
}
void ObTenantTabletStatMgr::reset()
{
stop();
wait();
TG_DESTROY(report_tg_id_);
{
ObBucketWLockAllGuard lock_guard(bucket_lock_);
stream_map_.destroy();
stream_pool_.destroy();
report_cursor_ = 0;
pending_cursor_ = 0;
report_tg_id_ = 0;
is_inited_ = false;
}
bucket_lock_.destroy();
load_shedder_.reset();
FLOG_INFO("ObTenantTabletStatMgr destroyed!");
}
int ObTenantTabletStatMgr::report_stat(
const ObTabletStat &stat,
bool &succ_report)
{
int ret = OB_SUCCESS;
succ_report = false;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("ObTenantTabletStatMgr not inited", K(ret));
} else if (OB_UNLIKELY(!stat.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("get invalid arguments", K(ret), K(stat));
} else if (!stat.check_need_report()) {
} else {
uint64_t pending_cur = pending_cursor_;
if (pending_cur - report_cursor_ >= DEFAULT_MAX_PENDING_CNT) { // first check full queue with dirty read
if (REACH_TENANT_TIME_INTERVAL(10 * 1000L * 1000L/*10s*/)) {
LOG_INFO("report_queue is full, wait to process", K(report_cursor_), K(pending_cur), K(stat));
}
} else if (FALSE_IT(pending_cur = ATOMIC_FAA(&pending_cursor_, 1))) {
} else if (pending_cur - report_cursor_ >= DEFAULT_MAX_PENDING_CNT) { // double check
if (REACH_TENANT_TIME_INTERVAL(10 * 1000L * 1000L/*10s*/)) {
LOG_INFO("report_queue is full, wait to process", K(report_cursor_), K(pending_cur), K(stat));
}
} else {
report_queue_[pending_cur % DEFAULT_MAX_PENDING_CNT] = stat;
succ_report = true;
}
}
return ret;
}
int ObTenantTabletStatMgr::get_latest_tablet_stat(
const share::ObLSID &ls_id,
const common::ObTabletID &tablet_id,
ObTabletStat &tablet_stat)
{
int ret = OB_SUCCESS;
tablet_stat.reset();
tablet_stat.ls_id_ = ls_id.id();
tablet_stat.tablet_id_ = tablet_id.id();
const ObTabletStatKey key(ls_id, tablet_id);
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("ObTenantTabletStatMgr not inited", K(ret));
} else if (OB_UNLIKELY(!key.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("get invalid arguments", K(ret), K(ls_id), K(tablet_id));
} else {
ObTabletStreamNode *stream_node = nullptr;
ObBucketHashRLockGuard lock_guard(bucket_lock_, key.hash());
if (OB_FAIL(stream_map_.get_refactored(key, stream_node))) {
if (OB_HASH_NOT_EXIST != ret) {
LOG_WARN("failed to get history stat", K(ret), K(key));
}
} else {
stream_node->stream_.get_latest_stat(tablet_stat);
}
}
return ret;
}
int ObTenantTabletStatMgr::clear_tablet_stat(
const share::ObLSID &ls_id,
const common::ObTabletID &tablet_id)
{
int ret = OB_SUCCESS;
const ObTabletStatKey key(ls_id, tablet_id);
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("ObTenantTabletStatMgr not inited", K(ret));
} else if (OB_UNLIKELY(!key.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("get invalid arguments", K(ret), K(ls_id), K(tablet_id));
} else {
ObBucketHashWLockGuard lock_guard(bucket_lock_, key.hash());
if (OB_FAIL(stream_map_.erase_refactored(key))) {
if (OB_HASH_NOT_EXIST == ret) {
ret = OB_SUCCESS;
} else {
LOG_WARN("failed to erase tablet stat", K(ret), K(key));
}
}
}
return ret;
}
int ObTenantTabletStatMgr::get_all_tablet_stats(
common::ObIArray<ObTabletStat> &tablet_stats)
{
int ret = OB_SUCCESS;
tablet_stats.reset();
ObTabletStreamNode *cur_node = nullptr;
ObTabletStat cur_stat;
for (auto bucket_it = stream_map_.begin(); OB_SUCC(ret) && bucket_it != stream_map_.end(); ++bucket_it) {
if (OB_NOT_NULL(cur_node = bucket_it->second)) {
cur_stat.reset();
cur_node->stream_.get_latest_stat(cur_stat);
if (!cur_stat.is_valid()) {
} else if (0 == cur_stat.query_cnt_ && 0 == cur_stat.merge_cnt_) {
// no tablet stat has been collected in the past 16 minutes.
} else if (OB_FAIL(tablet_stats.push_back(cur_stat))) {
LOG_WARN("failed to add tablet stat", K(ret), K(cur_stat));
}
}
}
return ret;
}
int ObTenantTabletStatMgr::get_history_tablet_stats(
const share::ObLSID &ls_id,
const common::ObTabletID &tablet_id,
common::ObIArray<ObTabletStat> &tablet_stats)
{
int ret = OB_SUCCESS;
const ObTabletStatKey key(ls_id, tablet_id);
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("ObTenantTabletStatMgr not inited", K(ret));
} else if (OB_UNLIKELY(!key.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("get invalid arguments", K(ret), K(ls_id), K(tablet_id));
} else {
ObTabletStreamNode *stream_node = nullptr;
ObBucketHashRLockGuard lock_guard(bucket_lock_, key.hash());
if (OB_FAIL(stream_map_.get_refactored(key, stream_node))) {
if (OB_HASH_NOT_EXIST != ret) {
LOG_WARN("failed to get history stat", K(ret), K(key));
}
} else if (OB_FAIL(stream_node->stream_.get_all_tablet_stat(tablet_stats))) {
LOG_WARN("failed to get all tablet stat", K(ret), K(key));
}
}
return ret;
}
int ObTenantTabletStatMgr::get_tablet_analyzer(
const share::ObLSID &ls_id,
const common::ObTabletID &tablet_id,
ObTabletStatAnalyzer &analyzer)
{
int ret = OB_SUCCESS;
ObTenantSysStat sys_stat;
if (OB_FAIL(get_latest_tablet_stat(ls_id, tablet_id, analyzer.tablet_stat_))) {
if (OB_HASH_NOT_EXIST != ret) {
LOG_WARN("failed to get latest tablet stat", K(ret), K(ls_id), K(tablet_id));
}
} else if (OB_FAIL(get_sys_stat(sys_stat))) {
LOG_WARN("failed to get sys stat", K(ret));
} else {
analyzer.is_small_tenant_ = sys_stat.is_small_tenant();
analyzer.boost_factor_ = analyzer.is_small_tenant_ ? 2 : 1;
}
return ret;
}
int ObTenantTabletStatMgr::get_sys_stat(ObTenantSysStat &sys_stat)
{
int ret = OB_SUCCESS;
if (OB_FAIL(GCTX.omt_->get_tenant_cpu_usage(MTL_ID(), sys_stat.cpu_usage_percentage_))) {
LOG_WARN("failed to get tenant cpu usage", K(ret), K(sys_stat));
} else if (OB_FAIL(GCTX.omt_->get_tenant_cpu(MTL_ID(), sys_stat.min_cpu_cnt_, sys_stat.max_cpu_cnt_))) {
LOG_WARN("failed to get tenant cpu count", K(ret), K(sys_stat));
} else {
sys_stat.memory_hold_ = lib::get_tenant_memory_hold(MTL_ID());
sys_stat.memory_limit_ = lib::get_tenant_memory_limit(MTL_ID());
sys_stat.cpu_usage_percentage_ *= 100 * 100;
}
return ret;
}
int ObTenantTabletStatMgr::update_tablet_stream(const ObTabletStat &report_stat)
{
int ret = OB_SUCCESS;
ObTabletStreamNode *stream_node = nullptr;
ObTabletStatKey key(report_stat.ls_id_, report_stat.tablet_id_);
{
ObBucketHashRLockGuard lock_guard(bucket_lock_, key.hash());
ret = stream_map_.get_refactored(key, stream_node);
}
if (OB_SUCC(ret)) {
} else if (OB_HASH_NOT_EXIST == ret) {
ret = OB_SUCCESS;
if (OB_FAIL(fetch_node(stream_node))) {
LOG_WARN("failed to fetch node from stream pool", K(ret), K(report_stat));
} else {
ObBucketHashWLockGuard lock_guard(bucket_lock_, key.hash());
if (OB_FAIL(stream_map_.set_refactored(key, stream_node))) {
LOG_WARN("failed to update stat map", K(ret), K(report_stat));
}
}
} else {
LOG_WARN("failed to get stream node from stream map", K(ret), K(key));
}
if (OB_SUCC(ret)) {
if (OB_ISNULL(stream_node)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("stream node is unexpected null", K(ret), K(report_stat));
} else if (OB_UNLIKELY(!stream_pool_.update_lru_list(stream_node))) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("failed to add node to lru list", K(ret), K(stream_node));
} else {
ObBucketHashWLockGuard lock_guard(bucket_lock_, key.hash());
stream_node->stream_.add_stat(report_stat);
}
}
if (OB_FAIL(ret) && OB_NOT_NULL(stream_node)) {
stream_pool_.remove_lru_list(stream_node);
stream_pool_.free(stream_node);
stream_node = nullptr;
}
return ret;
}
int ObTenantTabletStatMgr::fetch_node(ObTabletStreamNode *&node)
{
int ret = OB_SUCCESS;
bool is_retired = false;
node = nullptr;
if (OB_FAIL(stream_pool_.alloc(node, is_retired))) {
LOG_WARN("failed to alloc node", K(ret));
} else if (is_retired) { // get node from lru_list, should retire the old stat
ObTabletStatKey old_key = node->stream_.get_tablet_stat_key();
ObBucketHashWLockGuard lock_guard(bucket_lock_, old_key.hash());
if (OB_FAIL(stream_map_.erase_refactored(old_key))) {
LOG_WARN("failed to erase tablet stat stream", K(ret), K(old_key));
} else {
node->reset();
}
} else if (OB_UNLIKELY(!stream_pool_.add_lru_list(node))) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("failed to add node to lru list", K(ret), KPC(node));
stream_pool_.free(node);
}
if (OB_FAIL(ret) && OB_NOT_NULL(node)) {
node = nullptr;
}
return ret;
}
void ObTenantTabletStatMgr::process_stats()
{
int ret = OB_SUCCESS;
const uint64_t start_idx = report_cursor_;
const uint64_t pending_cur = ATOMIC_LOAD(&pending_cursor_);
uint64_t end_idx = (pending_cur > start_idx + DEFAULT_MAX_PENDING_CNT)
? start_idx + DEFAULT_MAX_PENDING_CNT
: pending_cur;
if (start_idx == end_idx) { // empty queue
} else {
for (uint64_t i = start_idx; i < end_idx; ++i) {
const ObTabletStat &cur_stat = report_queue_[i % DEFAULT_MAX_PENDING_CNT];
if (OB_UNLIKELY(!cur_stat.is_valid())) {
// allow dirty read
} else if (OB_FAIL(update_tablet_stream(cur_stat))) {
LOG_WARN_RET(ret, "failed to update tablet stat", K(ret), K(cur_stat));
}
}
report_cursor_ = pending_cur; // only TabletStatUpdater update this value.
}
}
void ObTenantTabletStatMgr::refresh_all(const int64_t step)
{
ObBucketWLockAllGuard lock_guard(bucket_lock_);
TabletStreamMap::iterator iter = stream_map_.begin();
for ( ; iter != stream_map_.end(); ++iter) {
for (int64_t i = 0; i < step; ++i) {
iter->second->stream_.refresh();
}
}
}
void ObTenantTabletStatMgr::TabletStatUpdater::runTimerTask()
{
mgr_.process_stats();
mgr_.refresh_sys_load();
int64_t interval_step = 0;
if (CHECK_SCHEDULE_TIME_INTERVAL(CHECK_INTERVAL, interval_step)) {
if (OB_UNLIKELY(interval_step > 1)) {
LOG_WARN_RET(OB_ERR_UNEXPECTED, "tablet streams not refresh too long", K(interval_step));
}
mgr_.refresh_all(interval_step);
FLOG_INFO("TenantTabletStatMgr refresh all tablet stream", K(MTL_ID()), K(interval_step));
}
}