/** * Copyright (c) 2023 OceanBase * OceanBase CE is licensed under Mulan PubL v2. * You can use this software according to the terms and conditions of the Mulan PubL v2. * You may obtain a copy of Mulan PubL v2 at: * http://license.coscl.org.cn/MulanPubL-2.0 * THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, * EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, * MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. * See the Mulan PubL v2 for more details. */ #define USING_LOG_PREFIX STORAGE #include "lib/oblog/ob_log_module.h" #include "share/ob_force_print_log.h" #include "share/ob_thread_mgr.h" #include "storage/ob_tenant_tablet_stat_mgr.h" #include "observer/ob_server_struct.h" #include "observer/ob_server.h" #include using namespace oceanbase; using namespace oceanbase::common; using namespace oceanbase::storage; bool ObTransNodeDMLStat::empty() const { return 0 >= insert_row_count_ && 0 >= update_row_count_ && 0 >= delete_row_count_; } void ObTransNodeDMLStat::atomic_inc(const ObTransNodeDMLStat &other) { if (other.empty()) { // do nothing } else { (void) ATOMIC_AAFx(&insert_row_count_, other.insert_row_count_, 0/*placeholder*/); (void) ATOMIC_AAFx(&update_row_count_, other.update_row_count_, 0/*placeholder*/); (void) ATOMIC_AAFx(&delete_row_count_, other.delete_row_count_, 0/*placeholder*/); } } /************************************* ObTabletStatKey *************************************/ ObTabletStatKey::ObTabletStatKey( const int64_t ls_id, const uint64_t tablet_id) : ls_id_(ls_id), tablet_id_(tablet_id) { } ObTabletStatKey::ObTabletStatKey( const share::ObLSID ls_id, const ObTabletID tablet_id) : ls_id_(ls_id), tablet_id_(tablet_id) { } ObTabletStatKey::~ObTabletStatKey() { } void ObTabletStatKey::reset() { ls_id_.reset(); tablet_id_.reset(); } uint64_t ObTabletStatKey::hash() const { uint64_t hash_val = 0; hash_val += ls_id_.hash(); hash_val += tablet_id_.hash(); return hash_val; } int ObTabletStatKey::hash(uint64_t &hash_val) const { hash_val = hash(); return OB_SUCCESS; } bool ObTabletStatKey::is_valid() const { return ls_id_.is_valid() && tablet_id_.is_valid(); } bool ObTabletStatKey::operator==(const ObTabletStatKey &other) const { bool bret = true; if (this == &other) { } else if (ls_id_ != other.ls_id_ || tablet_id_ != other.tablet_id_) { bret = false; } return bret; } bool ObTabletStatKey::operator!=(const ObTabletStatKey &other) const { return !(*this == other); } /************************************* ObTabletStat *************************************/ bool ObTabletStat::is_valid() const { return ls_id_ > 0 && tablet_id_ > 0; } bool ObTabletStat::check_need_report() const { bool bret = false; ObTabletID tablet_id(tablet_id_); if (tablet_id.is_ls_inner_tablet()) { // do nothing } else if (0 < merge_cnt_) { // report by compaction bret = get_total_merge_row_count() >= MERGE_REPORT_MIN_ROW_CNT; } else if (0 < query_cnt_) { // only report the slow query const int64_t boost_factor = tablet_id.is_inner_tablet() ? 2 : 1; if (scan_physical_row_cnt_ > 0 && scan_physical_row_cnt_ >= scan_logical_row_cnt_ * QUERY_REPORT_INEFFICIENT_THRESHOLD * boost_factor) { bret = true; } if (!bret && scan_micro_block_cnt_ > 0 && scan_micro_block_cnt_ >= pushdown_micro_block_cnt_ * QUERY_REPORT_INEFFICIENT_THRESHOLD * boost_factor) { bret = true; } if (!bret && exist_row_total_table_cnt_ > 0 && exist_row_total_table_cnt_ >= exist_row_read_table_cnt_ * QUERY_REPORT_INEFFICIENT_THRESHOLD * boost_factor) { bret = true; } } return bret; } ObTabletStat& ObTabletStat::operator=(const ObTabletStat &other) { if (this != &other) { MEMCPY(this, &other, sizeof(ObTabletStat)); } return *this; } ObTabletStat& ObTabletStat::operator+=(const ObTabletStat &other) { if (other.is_valid()) { ls_id_ = other.ls_id_; tablet_id_ = other.tablet_id_; query_cnt_ += other.query_cnt_; merge_cnt_ += other.merge_cnt_; scan_logical_row_cnt_ += other.scan_logical_row_cnt_; scan_physical_row_cnt_ += other.scan_physical_row_cnt_; scan_micro_block_cnt_ += other.scan_micro_block_cnt_; pushdown_micro_block_cnt_ += other.pushdown_micro_block_cnt_; exist_row_total_table_cnt_ += other.exist_row_total_table_cnt_; exist_row_read_table_cnt_ += other.exist_row_read_table_cnt_; insert_row_cnt_ += other.insert_row_cnt_; update_row_cnt_ += other.update_row_cnt_; delete_row_cnt_ += other.delete_row_cnt_; } return *this; } ObTabletStat& ObTabletStat::archive(int64_t factor) { if (factor > 0) { query_cnt_ /= factor; merge_cnt_ /= factor; scan_logical_row_cnt_ /= factor; scan_physical_row_cnt_ /= factor; scan_micro_block_cnt_ /= factor; pushdown_micro_block_cnt_ /= factor; exist_row_total_table_cnt_ /= factor; exist_row_read_table_cnt_ /= factor; insert_row_cnt_ /= factor; update_row_cnt_ /= factor; delete_row_cnt_ /= factor; } return *this; } /************************************* ObTabletStatAnalyzer *************************************/ ObTabletStatAnalyzer::ObTabletStatAnalyzer() : tablet_stat_(), boost_factor_(1), is_small_tenant_(false) { } bool ObTabletStatAnalyzer::is_hot_tablet() const { return tablet_stat_.query_cnt_ + tablet_stat_.merge_cnt_ >= ACCESS_FREQUENCY * boost_factor_; } bool ObTabletStatAnalyzer::is_insert_mostly() const { bool bret = false; ObTabletID tablet_id(tablet_stat_.tablet_id_); uint64_t total_row_cnt = tablet_stat_.get_total_merge_row_count(); if (tablet_id.is_inner_tablet() || tablet_id.is_ls_inner_tablet()) { // do nothing } else if (0 == tablet_stat_.insert_row_cnt_) { // no insert occurs } else if (total_row_cnt < MERGE_BASIC_ROW_CNT * boost_factor_) { // do nothing } else { bret = total_row_cnt * LOAD_THRESHOLD <= tablet_stat_.insert_row_cnt_ * BASE_FACTOR; } return bret; } bool ObTabletStatAnalyzer::is_update_or_delete_mostly() const { bool bret = false; uint64_t total_row_cnt = tablet_stat_.get_total_merge_row_count(); if (0 == tablet_stat_.delete_row_cnt_ + tablet_stat_.update_row_cnt_) { // no update && delete occurs } else if (total_row_cnt < MERGE_BASIC_ROW_CNT * boost_factor_) { // do nothing } else { bret = total_row_cnt * TOMBSTONE_THRESHOLD * boost_factor_ <= (tablet_stat_.update_row_cnt_ + tablet_stat_.delete_row_cnt_) * BASE_FACTOR; } return bret; } bool ObTabletStatAnalyzer::has_slow_query() const { bool bret = false; // all tablet query stats are ineffecient, only check the basic threshold if (tablet_stat_.scan_physical_row_cnt_ >= QUERY_BASIC_ROW_CNT * boost_factor_ || tablet_stat_.scan_micro_block_cnt_ >= QUERY_BASIC_MICRO_BLOCK_CNT * boost_factor_ || tablet_stat_.exist_row_total_table_cnt_ >= QUERY_BASIC_ITER_TABLE_CNT * boost_factor_) { bret = true; } return bret; } /************************************* ObTenantSysStat *************************************/ ObTenantSysStat::ObTenantSysStat() : cpu_usage_percentage_(0), min_cpu_cnt_(0), max_cpu_cnt_(0), memory_hold_(0), memory_limit_(0) { } void ObTenantSysStat::reset() { cpu_usage_percentage_ = 0; min_cpu_cnt_ = 0; max_cpu_cnt_ = 0; memory_hold_ = 0; memory_limit_ = 0; } bool ObTenantSysStat::is_small_tenant() const { bool bret = false; // 8c16g const int64_t cpu_threshold = 8; // When the tenant memory exceeds 10GB, the meta tenant occupies at least 10% of the memory. const int64_t mem_threshold = (16L << 30) * 9 / 10; bret = max_cpu_cnt_ < cpu_threshold || memory_limit_ < mem_threshold; return bret; } bool ObTenantSysStat::is_full_cpu_usage() const { bool bret = false; if (is_small_tenant()) { bret = 75 <= cpu_usage_percentage_; } else { bret = 85 <= cpu_usage_percentage_; } return bret; } /************************************* ObTabletStream *************************************/ ObTabletStream::ObTabletStream() : key_(), curr_buckets_(CURR_BUCKET_STEP), latest_buckets_(LATEST_BUCKET_STEP), past_buckets_(PAST_BUCKET_STEP) { } ObTabletStream::~ObTabletStream() { } void ObTabletStream::reset() { key_.reset(); curr_buckets_.reset(); latest_buckets_.reset(); past_buckets_.reset(); } void ObTabletStream::add_stat(const ObTabletStat &stat) { if (!key_.is_valid()) { key_.ls_id_ = stat.ls_id_; key_.tablet_id_ = stat.tablet_id_; } if (key_.ls_id_.id() == stat.ls_id_ && key_.tablet_id_.id() == stat.tablet_id_) { curr_buckets_.add(stat); } } void ObTabletStream::refresh() { ObTabletStat tablet_stat; bool has_retired_stat = false; curr_buckets_.refresh(tablet_stat, has_retired_stat); latest_buckets_.refresh(tablet_stat, has_retired_stat); past_buckets_.refresh(tablet_stat, has_retired_stat); } int ObTabletStream::get_all_tablet_stat(common::ObIArray &tablet_stats) const { int ret = OB_SUCCESS; if (OB_FAIL(get_bucket_tablet_stat(curr_buckets_, tablet_stats))) { LOG_WARN("failed to get bucket tablet stat in past bucket", K(ret)); } else if (OB_FAIL(get_bucket_tablet_stat(latest_buckets_, tablet_stats))) { LOG_WARN("failed to get bucket tablet stat in latest bucket", K(ret)); } else if (OB_FAIL(get_bucket_tablet_stat(past_buckets_, tablet_stats))) { LOG_WARN("failed to get bucket tablet stat in curr bucket", K(ret)); } return ret; } /************************************* ObTabletStreamPool *************************************/ ObTabletStreamPool::ObTabletStreamPool() : dynamic_allocator_(MTL_ID()), free_list_allocator_(ObMemAttr(MTL_ID(), "FreeTbltStream")), free_list_(), lru_list_(), max_free_list_num_(0), max_dynamic_node_num_(0), allocated_dynamic_num_(0), is_inited_(false) { } ObTabletStreamPool::~ObTabletStreamPool() { destroy(); } void ObTabletStreamPool::destroy() { is_inited_ = false; ObTabletStreamNode *node = nullptr; DLIST_REMOVE_ALL_NORET(node, lru_list_) { lru_list_.remove(node); if (DYNAMIC_ALLOC == node->flag_) { node->~ObTabletStreamNode(); // ObFIFOAllocator::reset does not release memory by default. dynamic_allocator_.free(node); } else { node->~ObTabletStreamNode(); } node = nullptr; } lru_list_.reset(); while (OB_SUCCESS == free_list_.pop(node)) { if (OB_NOT_NULL(node)) { node->~ObTabletStreamNode(); node = nullptr; } } dynamic_allocator_.reset(); free_list_.destroy(); free_list_allocator_.reset(); } int ObTabletStreamPool::init( const int64_t max_free_list_num, const int64_t max_dynamic_node_num) { int ret = OB_SUCCESS; const char *LABEL = "IncTbltStream"; ObTabletStreamNode *buf = nullptr; if (IS_INIT) { ret = OB_INIT_TWICE; LOG_WARN("ObTabletStreamPool has been inited", K(ret)); } else if (max_free_list_num <= 0 || max_dynamic_node_num < 0) { ret = OB_INVALID_ARGUMENT; LOG_WARN("get invalid argument", K(ret), K(max_free_list_num), K(max_dynamic_node_num)); } else if (OB_FAIL(dynamic_allocator_.init(ObMallocAllocator::get_instance(), OB_MALLOC_NORMAL_BLOCK_SIZE, ObMemAttr(MTL_ID(), LABEL)))) { LOG_WARN("failed to init fifo allocator", K(ret)); } else if (OB_FAIL(free_list_.init(max_free_list_num, &free_list_allocator_))) { LOG_WARN("failed to init free list", K(ret), K(max_free_list_num)); } else if (OB_ISNULL(buf = static_cast(free_list_allocator_.alloc(sizeof(ObTabletStreamNode) * max_free_list_num)))) { ret = OB_ALLOCATE_MEMORY_FAILED; LOG_WARN("failed to allocate memory for stream node in free list", K(ret), K(max_free_list_num)); } else { ObTabletStreamNode *node = nullptr; for (int64_t i = 0; OB_SUCC(ret) && i < max_free_list_num; ++i) { node = new (buf + i) ObTabletStreamNode(FIXED_ALLOC); if (OB_FAIL(free_list_.push(node))) { LOG_WARN("failed to push node to free list", K(ret)); } } if (OB_FAIL(ret)) { destroy(); } else { max_free_list_num_ = max_free_list_num; max_dynamic_node_num_ = max_dynamic_node_num; is_inited_ = true; } } return ret; } int ObTabletStreamPool::alloc(ObTabletStreamNode *&free_node, bool &is_retired) { int ret = OB_SUCCESS; is_retired = false; void *buf = nullptr; // 1. try to alloc node from free_list if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("ObTabletStreamPool not inited", K(ret)); } else if (OB_NOT_NULL(free_node)) { ret = OB_INVALID_ARGUMENT; LOG_WARN("get invalid argument", K(ret), K(free_node)); } else if (OB_FAIL(free_list_.pop(free_node))) { if (OB_ENTRY_NOT_EXIST != ret) { LOG_WARN("failed to pop free node from free list", K(ret)); } } // 2. no free node in free_list, try to alloc node dynamically if (OB_ENTRY_NOT_EXIST == ret) { ret = OB_SUCCESS; if (allocated_dynamic_num_ >= max_dynamic_node_num_) { ret = OB_SIZE_OVERFLOW; } else if (OB_ISNULL(buf = dynamic_allocator_.alloc(sizeof(ObTabletStreamNode)))) { ret = OB_ALLOCATE_MEMORY_FAILED; LOG_WARN("failed to allocate memory for free node", K(ret)); } else { free_node = new (buf) ObTabletStreamNode(DYNAMIC_ALLOC); ++allocated_dynamic_num_; } } // 3. dynamic node has reached the upper limit, try to retire the oldest node in lru_list if (OB_SIZE_OVERFLOW == ret) { ret = OB_SUCCESS; if (lru_list_.is_empty()) { ret = OB_ERR_UNEXPECTED; LOG_WARN("lru list is unexpected null", K(ret)); } else { free_node = lru_list_.get_last(); is_retired = true; } } return ret; } void ObTabletStreamPool::free(ObTabletStreamNode *node) { if (OB_NOT_NULL(node)) { int tmp_ret = OB_SUCCESS; if (IS_NOT_INIT) { tmp_ret = OB_NOT_INIT; LOG_ERROR_RET(tmp_ret, "[MEMORY LEAK] ObTabletStreamPool is not inited, cannot free this node!!!", K(tmp_ret), KPC(node)); } else if (DYNAMIC_ALLOC == node->flag_) { node->~ObTabletStreamNode(); dynamic_allocator_.free(node); --allocated_dynamic_num_; } else { node->~ObTabletStreamNode(); OB_ASSERT(OB_SUCCESS == free_list_.push(node)); } } } /************************************* ObTenantSysLoadShedder *************************************/ ObTenantSysLoadShedder::ObTenantSysLoadShedder() { reset(); } void ObTenantSysLoadShedder::reset() { MEMSET(this, 0, sizeof(ObTenantSysLoadShedder)); load_shedding_factor_ = 1; } void ObTenantSysLoadShedder::refresh_sys_load() { if (load_shedding_factor_ > 1 && ObTimeUtility::fast_current_time() < effect_time_ + SHEDDER_EXPIRE_TIME) { // do nothing } else if (REACH_TENANT_TIME_INTERVAL(CPU_TIME_SAMPLING_INTERVAL)) { load_shedding_factor_ = 1; int tmp_ret = OB_SUCCESS; double max_cpu_cnt = 0; double min_cpu_cnt = 0; if (OB_TMP_FAIL(GCTX.omt_->get_tenant_cpu(MTL_ID(), min_cpu_cnt, max_cpu_cnt))) { LOG_WARN_RET(tmp_ret, "failed to get tennant cpu cnt", "tenant_id", MTL_ID()); } else { min_cpu_cnt_ = min_cpu_cnt; max_cpu_cnt_ = max_cpu_cnt; } if (min_cpu_cnt_ > 0 && max_cpu_cnt_ > 0) { (void) refresh_cpu_utility(); } } } int ObTenantSysLoadShedder::refresh_cpu_utility() { int ret = OB_SUCCESS; int64_t curr_cpu_time = last_cpu_time_; int64_t inc_cpu_time = 0; int64_t physical_cpu_utility = 0; if (OB_FAIL(GCTX.omt_->get_tenant_cpu_time(MTL_ID(), curr_cpu_time))) { LOG_WARN("failed to get tennant cpu cnt", K(ret)); } else { const int64_t curr_sample_time = ObTimeUtility::fast_current_time(); if (0 == last_sample_time_ || 0 == last_cpu_time_) { // first time sample, no need to calculate cpu utility } else { inc_cpu_time = curr_cpu_time - last_cpu_time_; physical_cpu_utility = inc_cpu_time * 100 / (curr_sample_time - last_sample_time_); } if (physical_cpu_utility > max_cpu_cnt_ * 100) { ret = OB_ERR_UNEXPECTED; LOG_WARN("cpu utility unexpected bigger than cpu cnt", K(ret), K(max_cpu_cnt_), K(physical_cpu_utility), K(inc_cpu_time), K(curr_sample_time), K(last_sample_time_)); } else if (physical_cpu_utility >= max_cpu_cnt_ * 100 * CPU_TIME_THRESHOLD) { ATOMIC_STORE(&load_shedding_factor_, DEFAULT_LOAD_SHEDDING_FACTOR); effect_time_ = ObTimeUtility::fast_current_time(); FLOG_INFO("[ADAPTIVE_SCHED] refresh cpu utility", K(ret), K(load_shedding_factor_), K(max_cpu_cnt_), K(physical_cpu_utility), K(inc_cpu_time), K(curr_sample_time), K(last_sample_time_), K(curr_cpu_time), K(last_cpu_time_)); } last_sample_time_ = curr_sample_time; last_cpu_time_ = curr_cpu_time; } return ret; } /************************************* ObTenantTabletStatMgr *************************************/ ObTenantTabletStatMgr::ObTenantTabletStatMgr() : report_stat_task_(*this), stream_pool_(), stream_map_(), bucket_lock_(), report_queue_(), load_shedder_(), report_cursor_(0), pending_cursor_(0), report_tg_id_(0), is_inited_(false) { } ObTenantTabletStatMgr::~ObTenantTabletStatMgr() { destroy(); } int ObTenantTabletStatMgr::init(const int64_t tenant_id) { int ret = OB_SUCCESS; const bool repeat = true; int64_t bucket_num = DEFAULT_BUCKET_NUM; if (IS_INIT) { ret = OB_INIT_TWICE; LOG_WARN("ObTenantTabletStatMgr init twice", K(ret)); } else if (OB_FAIL(stream_pool_.init(DEFAULT_MAX_FREE_STREAM_CNT, DEFAULT_UP_LIMIT_STREAM_CNT))) { LOG_WARN("failed to init tablet stream pool", K(ret)); } else if (OB_FAIL(stream_map_.create(DEFAULT_BUCKET_NUM, ObMemAttr(tenant_id, "TabletStats")))) { LOG_WARN("failed to create TabletStats", K(ret)); } else if (FALSE_IT(bucket_num = stream_map_.bucket_count())) { } else if (OB_FAIL(bucket_lock_.init(bucket_num, ObLatchIds::DEFAULT_BUCKET_LOCK, ObMemAttr(tenant_id, "TabStatMgrLock")))) { LOG_WARN("failed to init bucket lock", K(ret)); } else if (OB_FAIL(TG_CREATE_TENANT(lib::TGDefIDs::TabletStatRpt, report_tg_id_))) { LOG_WARN("failed to create TabletStatRpt thread", K(ret)); } else if (OB_FAIL(TG_START(report_tg_id_))) { LOG_WARN("failed to start stat TabletStatRpt thread", K(ret)); } else if (OB_FAIL(TG_SCHEDULE(report_tg_id_, report_stat_task_, TABLET_STAT_PROCESS_INTERVAL, repeat))) { LOG_WARN("failed to schedule tablet stat update task", K(ret)); } else { load_shedder_.refresh_sys_load(); is_inited_ = true; } if (!is_inited_) { reset(); } return ret; } int ObTenantTabletStatMgr::mtl_init(ObTenantTabletStatMgr* &tablet_stat_mgr) { int ret = OB_SUCCESS; if (OB_FAIL(tablet_stat_mgr->init(MTL_ID()))) { LOG_WARN("failed to init tablet stat mgr", K(ret), K(MTL_ID())); } else { LOG_INFO("success to init ObTenantTabletStatMgr", K(MTL_ID())); } return ret; } void ObTenantTabletStatMgr::wait() { TG_WAIT(report_tg_id_); } void ObTenantTabletStatMgr::stop() { TG_STOP(report_tg_id_); } void ObTenantTabletStatMgr::destroy() { if (IS_INIT) { reset(); } } void ObTenantTabletStatMgr::reset() { stop(); wait(); TG_DESTROY(report_tg_id_); { ObBucketWLockAllGuard lock_guard(bucket_lock_); stream_map_.destroy(); stream_pool_.destroy(); report_cursor_ = 0; pending_cursor_ = 0; report_tg_id_ = 0; is_inited_ = false; } bucket_lock_.destroy(); load_shedder_.reset(); FLOG_INFO("ObTenantTabletStatMgr destroyed!"); } int ObTenantTabletStatMgr::report_stat( const ObTabletStat &stat, bool &succ_report) { int ret = OB_SUCCESS; succ_report = false; if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("ObTenantTabletStatMgr not inited", K(ret)); } else if (OB_UNLIKELY(!stat.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("get invalid arguments", K(ret), K(stat)); } else if (!stat.check_need_report()) { } else { uint64_t pending_cur = pending_cursor_; if (pending_cur - report_cursor_ >= DEFAULT_MAX_PENDING_CNT) { // first check full queue with dirty read if (REACH_TENANT_TIME_INTERVAL(10 * 1000L * 1000L/*10s*/)) { LOG_INFO("report_queue is full, wait to process", K(report_cursor_), K(pending_cur), K(stat)); } } else if (FALSE_IT(pending_cur = ATOMIC_FAA(&pending_cursor_, 1))) { } else if (pending_cur - report_cursor_ >= DEFAULT_MAX_PENDING_CNT) { // double check if (REACH_TENANT_TIME_INTERVAL(10 * 1000L * 1000L/*10s*/)) { LOG_INFO("report_queue is full, wait to process", K(report_cursor_), K(pending_cur), K(stat)); } } else { report_queue_[pending_cur % DEFAULT_MAX_PENDING_CNT] = stat; succ_report = true; } } return ret; } int ObTenantTabletStatMgr::get_latest_tablet_stat( const share::ObLSID &ls_id, const common::ObTabletID &tablet_id, ObTabletStat &tablet_stat) { int ret = OB_SUCCESS; tablet_stat.reset(); tablet_stat.ls_id_ = ls_id.id(); tablet_stat.tablet_id_ = tablet_id.id(); const ObTabletStatKey key(ls_id, tablet_id); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("ObTenantTabletStatMgr not inited", K(ret)); } else if (OB_UNLIKELY(!key.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("get invalid arguments", K(ret), K(ls_id), K(tablet_id)); } else { ObTabletStreamNode *stream_node = nullptr; ObBucketHashRLockGuard lock_guard(bucket_lock_, key.hash()); if (OB_FAIL(stream_map_.get_refactored(key, stream_node))) { if (OB_HASH_NOT_EXIST != ret) { LOG_WARN("failed to get history stat", K(ret), K(key)); } } else { stream_node->stream_.get_latest_stat(tablet_stat); } } return ret; } int ObTenantTabletStatMgr::clear_tablet_stat( const share::ObLSID &ls_id, const common::ObTabletID &tablet_id) { int ret = OB_SUCCESS; const ObTabletStatKey key(ls_id, tablet_id); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("ObTenantTabletStatMgr not inited", K(ret)); } else if (OB_UNLIKELY(!key.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("get invalid arguments", K(ret), K(ls_id), K(tablet_id)); } else { ObBucketHashWLockGuard lock_guard(bucket_lock_, key.hash()); if (OB_FAIL(stream_map_.erase_refactored(key))) { if (OB_HASH_NOT_EXIST == ret) { ret = OB_SUCCESS; } else { LOG_WARN("failed to erase tablet stat", K(ret), K(key)); } } } return ret; } int ObTenantTabletStatMgr::get_all_tablet_stats( common::ObIArray &tablet_stats) { int ret = OB_SUCCESS; tablet_stats.reset(); ObTabletStreamNode *cur_node = nullptr; ObTabletStat cur_stat; for (auto bucket_it = stream_map_.begin(); OB_SUCC(ret) && bucket_it != stream_map_.end(); ++bucket_it) { if (OB_NOT_NULL(cur_node = bucket_it->second)) { cur_stat.reset(); cur_node->stream_.get_latest_stat(cur_stat); if (!cur_stat.is_valid()) { } else if (0 == cur_stat.query_cnt_ && 0 == cur_stat.merge_cnt_) { // no tablet stat has been collected in the past 16 minutes. } else if (OB_FAIL(tablet_stats.push_back(cur_stat))) { LOG_WARN("failed to add tablet stat", K(ret), K(cur_stat)); } } } return ret; } int ObTenantTabletStatMgr::get_history_tablet_stats( const share::ObLSID &ls_id, const common::ObTabletID &tablet_id, common::ObIArray &tablet_stats) { int ret = OB_SUCCESS; const ObTabletStatKey key(ls_id, tablet_id); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("ObTenantTabletStatMgr not inited", K(ret)); } else if (OB_UNLIKELY(!key.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("get invalid arguments", K(ret), K(ls_id), K(tablet_id)); } else { ObTabletStreamNode *stream_node = nullptr; ObBucketHashRLockGuard lock_guard(bucket_lock_, key.hash()); if (OB_FAIL(stream_map_.get_refactored(key, stream_node))) { if (OB_HASH_NOT_EXIST != ret) { LOG_WARN("failed to get history stat", K(ret), K(key)); } } else if (OB_FAIL(stream_node->stream_.get_all_tablet_stat(tablet_stats))) { LOG_WARN("failed to get all tablet stat", K(ret), K(key)); } } return ret; } int ObTenantTabletStatMgr::get_tablet_analyzer( const share::ObLSID &ls_id, const common::ObTabletID &tablet_id, ObTabletStatAnalyzer &analyzer) { int ret = OB_SUCCESS; ObTenantSysStat sys_stat; if (OB_FAIL(get_latest_tablet_stat(ls_id, tablet_id, analyzer.tablet_stat_))) { if (OB_HASH_NOT_EXIST != ret) { LOG_WARN("failed to get latest tablet stat", K(ret), K(ls_id), K(tablet_id)); } } else if (OB_FAIL(get_sys_stat(sys_stat))) { LOG_WARN("failed to get sys stat", K(ret)); } else { analyzer.is_small_tenant_ = sys_stat.is_small_tenant(); analyzer.boost_factor_ = analyzer.is_small_tenant_ ? 2 : 1; } return ret; } int ObTenantTabletStatMgr::get_sys_stat(ObTenantSysStat &sys_stat) { int ret = OB_SUCCESS; if (OB_FAIL(GCTX.omt_->get_tenant_cpu_usage(MTL_ID(), sys_stat.cpu_usage_percentage_))) { LOG_WARN("failed to get tenant cpu usage", K(ret), K(sys_stat)); } else if (OB_FAIL(GCTX.omt_->get_tenant_cpu(MTL_ID(), sys_stat.min_cpu_cnt_, sys_stat.max_cpu_cnt_))) { LOG_WARN("failed to get tenant cpu count", K(ret), K(sys_stat)); } else { sys_stat.memory_hold_ = lib::get_tenant_memory_hold(MTL_ID()); sys_stat.memory_limit_ = lib::get_tenant_memory_limit(MTL_ID()); sys_stat.cpu_usage_percentage_ *= 100 * 100; } return ret; } int ObTenantTabletStatMgr::update_tablet_stream(const ObTabletStat &report_stat) { int ret = OB_SUCCESS; ObTabletStreamNode *stream_node = nullptr; ObTabletStatKey key(report_stat.ls_id_, report_stat.tablet_id_); { ObBucketHashRLockGuard lock_guard(bucket_lock_, key.hash()); ret = stream_map_.get_refactored(key, stream_node); } if (OB_SUCC(ret)) { } else if (OB_HASH_NOT_EXIST == ret) { ret = OB_SUCCESS; if (OB_FAIL(fetch_node(stream_node))) { LOG_WARN("failed to fetch node from stream pool", K(ret), K(report_stat)); } else { ObBucketHashWLockGuard lock_guard(bucket_lock_, key.hash()); if (OB_FAIL(stream_map_.set_refactored(key, stream_node))) { LOG_WARN("failed to update stat map", K(ret), K(report_stat)); } } } else { LOG_WARN("failed to get stream node from stream map", K(ret), K(key)); } if (OB_SUCC(ret)) { if (OB_ISNULL(stream_node)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("stream node is unexpected null", K(ret), K(report_stat)); } else if (OB_UNLIKELY(!stream_pool_.update_lru_list(stream_node))) { ret = OB_ERR_UNEXPECTED; LOG_WARN("failed to add node to lru list", K(ret), K(stream_node)); } else { ObBucketHashWLockGuard lock_guard(bucket_lock_, key.hash()); stream_node->stream_.add_stat(report_stat); } } if (OB_FAIL(ret) && OB_NOT_NULL(stream_node)) { stream_pool_.remove_lru_list(stream_node); stream_pool_.free(stream_node); stream_node = nullptr; } return ret; } int ObTenantTabletStatMgr::fetch_node(ObTabletStreamNode *&node) { int ret = OB_SUCCESS; bool is_retired = false; node = nullptr; if (OB_FAIL(stream_pool_.alloc(node, is_retired))) { LOG_WARN("failed to alloc node", K(ret)); } else if (is_retired) { // get node from lru_list, should retire the old stat ObTabletStatKey old_key = node->stream_.get_tablet_stat_key(); ObBucketHashWLockGuard lock_guard(bucket_lock_, old_key.hash()); if (OB_FAIL(stream_map_.erase_refactored(old_key))) { LOG_WARN("failed to erase tablet stat stream", K(ret), K(old_key)); } else { node->reset(); } } else if (OB_UNLIKELY(!stream_pool_.add_lru_list(node))) { ret = OB_ERR_UNEXPECTED; LOG_WARN("failed to add node to lru list", K(ret), KPC(node)); stream_pool_.free(node); } if (OB_FAIL(ret) && OB_NOT_NULL(node)) { node = nullptr; } return ret; } void ObTenantTabletStatMgr::process_stats() { int ret = OB_SUCCESS; const uint64_t start_idx = report_cursor_; const uint64_t pending_cur = ATOMIC_LOAD(&pending_cursor_); uint64_t end_idx = (pending_cur > start_idx + DEFAULT_MAX_PENDING_CNT) ? start_idx + DEFAULT_MAX_PENDING_CNT : pending_cur; if (start_idx == end_idx) { // empty queue } else { for (uint64_t i = start_idx; i < end_idx; ++i) { const ObTabletStat &cur_stat = report_queue_[i % DEFAULT_MAX_PENDING_CNT]; if (OB_UNLIKELY(!cur_stat.is_valid())) { // allow dirty read } else if (OB_FAIL(update_tablet_stream(cur_stat))) { LOG_WARN_RET(ret, "failed to update tablet stat", K(ret), K(cur_stat)); } } report_cursor_ = pending_cur; // only TabletStatUpdater update this value. } } void ObTenantTabletStatMgr::refresh_all(const int64_t step) { ObBucketWLockAllGuard lock_guard(bucket_lock_); TabletStreamMap::iterator iter = stream_map_.begin(); for ( ; iter != stream_map_.end(); ++iter) { for (int64_t i = 0; i < step; ++i) { iter->second->stream_.refresh(); } } } void ObTenantTabletStatMgr::TabletStatUpdater::runTimerTask() { mgr_.process_stats(); mgr_.refresh_sys_load(); int64_t interval_step = 0; if (CHECK_SCHEDULE_TIME_INTERVAL(CHECK_INTERVAL, interval_step)) { if (OB_UNLIKELY(interval_step > 1)) { LOG_WARN_RET(OB_ERR_UNEXPECTED, "tablet streams not refresh too long", K(interval_step)); } mgr_.refresh_all(interval_step); FLOG_INFO("TenantTabletStatMgr refresh all tablet stream", K(MTL_ID()), K(interval_step)); } }