Files
oceanbase/src/storage/compaction/ob_tenant_medium_checker.cpp
2024-02-06 23:10:57 +00:00

375 lines
13 KiB
C++

/**
* Copyright (c) 2023 OceanBase
* OceanBase is licensed under Mulan PubL v2.
* You can use this software according to the terms and conditions of the Mulan PubL v2.
* You may obtain a copy of Mulan PubL v2 at:
* http://license.coscl.org.cn/MulanPubL-2.0
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
* See the Mulan PubL v2 for more details.
*/
#define USING_LOG_PREFIX STORAGE_COMPACTION
#include "storage/compaction/ob_tenant_medium_checker.h"
#include "storage/compaction/ob_medium_compaction_func.h"
#include "storage/compaction/ob_compaction_diagnose.h"
#include "storage/compaction/ob_server_compaction_event_history.h"
#include "storage/compaction/ob_tablet_merge_ctx.h"
#include "storage/ls/ob_ls.h"
#include "storage/tablet/ob_tablet.h"
#include "storage/tx_storage/ob_ls_service.h"
namespace oceanbase
{
using namespace storage;
namespace compaction
{
/*
* ObTabletCheckInfo implement
* */
bool ObTabletCheckInfo::is_valid() const
{
return tablet_id_.is_valid() && ls_id_.is_valid() &&
check_medium_scn_ != 0;
}
uint64_t ObTabletCheckInfo::hash() const
{
uint64_t hash_val = 0;
hash_val = murmurhash(&tablet_id_, sizeof(tablet_id_), hash_val);
hash_val = murmurhash(&ls_id_, sizeof(ls_id_), hash_val);
return hash_val;
}
bool ObTabletCheckInfo::operator==(const ObTabletCheckInfo &other) const
{
return tablet_id_ == other.tablet_id_ &&
ls_id_ == other.ls_id_;
}
/*
* ObBatchFinishCheckStat implement
* */
int64_t ObBatchFinishCheckStat::to_string(char *buf, const int64_t buf_len) const
{
int ret = OB_SUCCESS;
int64_t pos = 0;
J_OBJ_START();
J_KV(K_(succ_cnt), K_(finish_cnt), K_(fail_cnt), K_(filter_cnt));
if (0 != fail_cnt_) {
J_COMMA();
J_KV(K_(failed_info));
}
J_OBJ_END();
return pos;
}
/*
* ObTenantMediumChecker implement
* */
int ObTenantMediumChecker::mtl_init(ObTenantMediumChecker *&tablet_medium_checker)
{
return tablet_medium_checker->init();
}
ObTenantMediumChecker::ObTenantMediumChecker()
: is_inited_(false),
last_check_timestamp_(0),
ls_locality_cache_(),
tablet_ls_set_(),
ls_info_map_(),
lock_()
{}
ObTenantMediumChecker::~ObTenantMediumChecker()
{
destroy();
}
int ObTenantMediumChecker::init()
{
int ret = OB_SUCCESS;
if (OB_FAIL(ls_locality_cache_.init(MTL_ID()))) {
LOG_WARN("failed to init ls locality cache", K(ret));
} else if (OB_FAIL(tablet_ls_set_.create(DEFAULT_MAP_BUCKET, "MedCheckSet", "CheckSetNode", MTL_ID()))) {
LOG_WARN("failed to create set", K(ret));
} else if (OB_FAIL(ls_info_map_.create(OB_MAX_LS_NUM_PER_TENANT_PER_SERVER, "MedCheckMap", "CheckMapNode", MTL_ID()))) {
LOG_WARN("failed to create map", K(ret));
} else {
is_inited_ = true;
}
if (!is_inited_) {
destroy();
}
return ret;
}
void ObTenantMediumChecker::destroy()
{
is_inited_ = false;
ls_locality_cache_.destroy();
if (tablet_ls_set_.created()) {
tablet_ls_set_.destroy();
}
if (ls_info_map_.created()) {
ls_info_map_.destroy();
}
}
int ObTenantMediumChecker::refresh_ls_status()
{
int ret = OB_SUCCESS;
int tmp_ret = OB_SUCCESS;
lib::ObMutexGuard guard(lock_);
if (OB_TMP_FAIL(ls_locality_cache_.refresh_ls_locality(true/*force_refresh*/))) {
LOG_WARN("failed to refresh ls locality", K(tmp_ret));
}
common::ObSEArray<share::ObLSID, LS_ID_ARRAY_CNT> ls_ids;
if (OB_FAIL(MTL(ObLSService *)->get_ls_ids(ls_ids))) {
LOG_WARN("failed to get all ls id", K(ret));
} else {
ls_info_map_.reuse();
for (int64_t i = 0; i < ls_ids.count(); ++i) {
const ObLSID &ls_id = ls_ids[i];
ObLSInfo ls_info;
bool is_election_leader = false;
if (OB_TMP_FAIL(ObMediumCompactionScheduleFunc::is_election_leader(ls_id, is_election_leader))) {
if (OB_LS_NOT_EXIST != tmp_ret) {
LOG_WARN("failed to get palf handle role", K(tmp_ret), K(ls_id));
}
} else if (is_election_leader) {
if (OB_TMP_FAIL(ls_locality_cache_.get_ls_info(ls_id, ls_info))) {
if (OB_HASH_NOT_EXIST != tmp_ret) {
LOG_WARN("failed to get ls locality", K(tmp_ret), K(ls_id));
}
} else if (OB_TMP_FAIL(ls_info_map_.set_refactored(ls_id, ls_info))) {
LOG_WARN("fail to set map", K(ret), K(ls_id));
}
}
}
}
return ret;
}
int ObTenantMediumChecker::check_ls_status(const share::ObLSID &ls_id, bool &is_leader, bool need_check)
{
int ret = OB_SUCCESS;
int tmp_ret = OB_SUCCESS;
is_leader = false;
if (need_check
&& CHECK_LS_LOCALITY_INTERVAL < ObTimeUtility::fast_current_time() - last_check_timestamp_) {
if (OB_TMP_FAIL(refresh_ls_status())) {
LOG_WARN("failed to refresh ls locality", K(tmp_ret));
} else {
last_check_timestamp_ = ObTimeUtility::fast_current_time();
}
}
lib::ObMutexGuard guard(lock_);
ObLSInfo ls_info;
if (OB_FAIL(ls_info_map_.get_refactored(ls_id, ls_info))) {
if (OB_HASH_NOT_EXIST != ret) {
LOG_WARN("fail to get map", K(ret), K(ls_id));
} else {
ret = OB_SUCCESS;
}
} else {
is_leader = true;
}
return ret;
}
int ObTenantMediumChecker::add_tablet_ls(const ObTabletID &tablet_id, const share::ObLSID &ls_id, const int64_t medium_scn)
{
int ret = OB_SUCCESS;
int tmp_ret = OB_SUCCESS;
bool is_leader = false;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("ObTenantMediumChecker is not inited", K(ret));
} else if (!tablet_id.is_valid() || !ls_id.is_valid() || 0 == medium_scn) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid argument", K(ret), K(tablet_id), K(ls_id), K(medium_scn));
} else if (OB_FAIL(check_ls_status(ls_id, is_leader, true/*need force check role*/))) {
LOG_WARN("fail to check ls status", K(ret), K(ls_id));
} else if (is_leader) {
lib::ObMutexGuard guard(lock_);
// just cover the old info
if (OB_FAIL(tablet_ls_set_.set_refactored(ObTabletCheckInfo(tablet_id, ls_id, medium_scn)))) {
LOG_WARN("failed to set tablet_ls_info", K(ret), K(ls_id), K(tablet_id));
}
}
return ret;
}
bool ObTenantMediumChecker::locality_cache_empty()
{
bool ret = true;
if (IS_INIT) {
lib::ObMutexGuard guard(lock_);
ret = ls_locality_cache_.empty();
}
return ret;
}
int ObTenantMediumChecker::check_medium_finish_schedule()
{
int ret = OB_SUCCESS;
int tmp_ret = OB_SUCCESS;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("ObTenantMediumChecker is not inited", K(ret));
} else {
// refresh ls locality cache
if (OB_TMP_FAIL(ls_locality_cache_.refresh_ls_locality(false /*force_refresh*/))) {
LOG_WARN("failed to refresh ls locality", K(tmp_ret));
ADD_COMMON_SUSPECT_INFO(MEDIUM_MERGE, share::ObDiagnoseTabletType::TYPE_MEDIUM_MERGE,
SUSPECT_FAILED_TO_REFRESH_LS_LOCALITY, tmp_ret);
} else {
DEL_SUSPECT_INFO(MEDIUM_MERGE, UNKNOW_LS_ID, UNKNOW_TABLET_ID, ObDiagnoseTabletType::TYPE_MEDIUM_MERGE);
}
TabletLSArray tablet_ls_infos;
tablet_ls_infos.set_attr(ObMemAttr(MTL_ID(), "CheckInfos"));
TabletLSArray batch_tablet_ls_infos;
batch_tablet_ls_infos.set_attr(ObMemAttr(MTL_ID(), "BCheckInfos"));
TabletLSArray finish_tablet_ls_infos;
finish_tablet_ls_infos.set_attr(ObMemAttr(MTL_ID(), "FinishInfos"));
// copy the tablet_ls_infos from set // with lock
{
lib::ObMutexGuard guard(lock_);
if (OB_FAIL(tablet_ls_infos.reserve(tablet_ls_set_.size()))) {
LOG_WARN("fail to reserve array", K(ret), "size", tablet_ls_set_.size());
} else {
for (TabletLSSet::const_iterator iter = tablet_ls_set_.begin();
OB_SUCC(ret) && iter != tablet_ls_set_.end(); ++iter) {
if (OB_FAIL(tablet_ls_infos.push_back(iter->first))) {
LOG_WARN("failed to push back tablet_ls_info", K(ret), K(iter->first));
}
}
}
if (OB_SUCC(ret)) {
tablet_ls_set_.clear();
}
}
const int64_t batch_size = MTL(ObTenantTabletScheduler *)->get_checker_batch_size();
if (OB_FAIL(ret) || tablet_ls_infos.empty()) {
} else if (OB_FAIL(batch_tablet_ls_infos.reserve(batch_size))) {
LOG_WARN("fail to reserve array", K(ret), "size", batch_size);
} else if (OB_FAIL(finish_tablet_ls_infos.reserve(batch_size))) {
LOG_WARN("fail to reserve array", K(ret), "size", batch_size);
} else {
// batch check
int64_t info_count = tablet_ls_infos.count();
int64_t start_idx = 0;
int64_t end_idx = min(batch_size, info_count);
int64_t cost_ts = ObTimeUtility::fast_current_time();
ObBatchFinishCheckStat stat;
while (start_idx < end_idx) {
if (OB_TMP_FAIL(check_medium_finish(tablet_ls_infos, start_idx, end_idx, batch_tablet_ls_infos, finish_tablet_ls_infos, stat))) {
LOG_WARN("failed to check medium finish", K(tmp_ret));
}
start_idx = end_idx;
end_idx = min(start_idx + batch_size, info_count);
}
cost_ts = ObTimeUtility::fast_current_time() - cost_ts;
ADD_COMPACTION_EVENT(
MTL(ObTenantTabletScheduler*)->get_frozen_version(),
ObServerCompactionEvent::COMPACTION_FINISH_CHECK,
ObTimeUtility::fast_current_time(),
K(cost_ts), "batch_check_stat", stat);
}
}
return ret;
}
int ObTenantMediumChecker::check_medium_finish(
const ObIArray<ObTabletCheckInfo> &tablet_ls_infos,
int64_t start_idx,
int64_t end_idx,
ObIArray<ObTabletCheckInfo> &check_tablet_ls_infos,
ObIArray<ObTabletCheckInfo> &finish_tablet_ls_infos,
ObBatchFinishCheckStat &stat)
{
int ret = OB_SUCCESS;
int tmp_ret = OB_SUCCESS;
if (OB_UNLIKELY(tablet_ls_infos.empty()
|| start_idx < 0
|| start_idx >= end_idx
|| end_idx > tablet_ls_infos.count())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid argument", KR(ret), K(tablet_ls_infos), K(start_idx), K(end_idx));
} else {
check_tablet_ls_infos.reuse();
finish_tablet_ls_infos.reuse();
for (int64_t i = start_idx; OB_SUCC(ret) && i < end_idx; ++i) {
const ObLSID &ls_id = tablet_ls_infos.at(i).get_ls_id();
bool is_leader = false;
if (OB_UNLIKELY(0 == tablet_ls_infos.at(i).get_medium_scn())) {
tmp_ret = OB_ERR_UNEXPECTED;
LOG_WARN("unexpected medium scn", K(tmp_ret), K(tablet_ls_infos.at(i)));
} else if (OB_TMP_FAIL(check_ls_status(ls_id, is_leader, false/*no need force check role*/))) {
LOG_WARN("fail to check ls status", K(tmp_ret), K(ls_id));
} else if (is_leader) {
if (OB_FAIL(check_tablet_ls_infos.push_back(tablet_ls_infos.at(i)))) {
LOG_WARN("fail to push back check_tablet_ls_infos", K(ret), K(tablet_ls_infos.at(i)));
}
}
}
ObCompactionScheduleTimeGuard time_guard;
stat.filter_cnt_ += (end_idx - start_idx - check_tablet_ls_infos.count());
if (FAILEDx(ObMediumCompactionScheduleFunc::batch_check_medium_finish(
ls_info_map_, finish_tablet_ls_infos, check_tablet_ls_infos, time_guard))) {
LOG_WARN("failed to batch check medium finish", K(ret), K(tablet_ls_infos.count()), K(check_tablet_ls_infos.count()),
K(tablet_ls_infos), K(check_tablet_ls_infos));
stat.fail_cnt_ += check_tablet_ls_infos.count();
if (0 != stat.fail_cnt_) {
stat.failed_info_ = check_tablet_ls_infos.at(0);
}
if (OB_TMP_FAIL(reput_check_info(check_tablet_ls_infos))) {
LOG_WARN("fail to reput failed check infos", K(tmp_ret));
}
} else {
LOG_INFO("success to check medium finish", K(ret), K(tablet_ls_infos.count()), K(check_tablet_ls_infos.count()),
K(finish_tablet_ls_infos.count()), K(tablet_ls_infos), K(check_tablet_ls_infos), K(finish_tablet_ls_infos));
stat.succ_cnt_ += check_tablet_ls_infos.count();
stat.finish_cnt_ += finish_tablet_ls_infos.count();
if (OB_FAIL(MTL(ObTenantTabletScheduler*)->schedule_next_round_for_leader(check_tablet_ls_infos, finish_tablet_ls_infos))) {
LOG_WARN("failed to leader schedule", K(ret));
} else {
time_guard.click(ObCompactionScheduleTimeGuard::SCHEDULER_NEXT_ROUND);
}
}
LOG_INFO("finish medium check", K(ret), K(start_idx), K(end_idx),
K(check_tablet_ls_infos.count()), K(finish_tablet_ls_infos.count()), K(time_guard));
}
return ret;
}
// just reput into set without ls status check
int ObTenantMediumChecker::reput_check_info(ObIArray<ObTabletCheckInfo> &tablet_ls_infos)
{
int ret = OB_SUCCESS;
int tmp_ret = OB_SUCCESS;
bool is_leader = false;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("ObTenantMediumChecker is not inited", K(ret));
} else {
lib::ObMutexGuard guard(lock_);
for (int64_t i = 0; OB_SUCC(ret) && i < tablet_ls_infos.count(); ++i) {
const ObTabletCheckInfo &check_info = tablet_ls_infos.at(i);
if (OB_HASH_EXIST == (tmp_ret = tablet_ls_set_.exist_refactored(check_info))) {
ret = OB_SUCCESS; // tablet exist
} else if (OB_UNLIKELY(OB_HASH_NOT_EXIST != tmp_ret)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("failed to check exist in tablet set", K(ret), K(tmp_ret), K(check_info));
} else if (OB_TMP_FAIL(tablet_ls_set_.set_refactored(check_info))) {
LOG_WARN("failed to set tablet_ls_info", K(tmp_ret), K(check_info));
}
}
}
return ret;
}
}
}