/** * Copyright (c) 2021 OceanBase * OceanBase CE is licensed under Mulan PubL v2. * You can use this software according to the terms and conditions of the Mulan PubL v2. * You may obtain a copy of Mulan PubL v2 at: * http://license.coscl.org.cn/MulanPubL-2.0 * THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, * EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, * MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. * See the Mulan PubL v2 for more details. */ #define USING_LOG_PREFIX STORAGE #include "storage/ls/ob_ls.h" #include "storage/checkpoint/ob_checkpoint_executor.h" #include "storage/tx_storage/ob_checkpoint_service.h" #include "storage/checkpoint/ob_data_checkpoint.h" #include "share/ob_force_print_log.h" #include "logservice/ob_log_base_type.h" namespace oceanbase { using namespace share; using namespace logservice; namespace storage { namespace checkpoint { ObCheckpointExecutor::ObCheckpointExecutor() : rwlock_(common::ObLatchIds::CLOG_CKPT_RWLOCK), update_checkpoint_enabled_(false), reuse_recycle_scn_times_(0), prev_clog_checkpoint_lsn_(), prev_recycle_scn_() { reset(); } ObCheckpointExecutor::~ObCheckpointExecutor() { reset(); } void ObCheckpointExecutor::reset() { for (int i = 0; i < ObLogBaseType::MAX_LOG_BASE_TYPE; i++) { handlers_[i] = NULL; } ls_ = NULL; loghandler_ = NULL; reuse_recycle_scn_times_ = 0; prev_clog_checkpoint_lsn_.reset(); prev_recycle_scn_.set_invalid(); } int ObCheckpointExecutor::register_handler(const ObLogBaseType &type, ObICheckpointSubHandler *handler) { int ret = OB_SUCCESS; if (!is_valid_log_base_type(type) || NULL == handler) { ret = OB_INVALID_ARGUMENT; STORAGE_LOG(WARN, "invalid arguments", K(ret), K(type), K(handler)); } else { if (OB_NOT_NULL(handlers_[type])) { STORAGE_LOG(WARN, "repeat register into checkpoint_executor", K(ret), K(type), K(handler)); } else { handlers_[type] = handler; } } return ret; } void ObCheckpointExecutor::unregister_handler(const ObLogBaseType &type) { int ret = OB_SUCCESS; if (!is_valid_log_base_type(type)) { ret = OB_INVALID_ARGUMENT; STORAGE_LOG(WARN, "invalid arguments", K(ret), K(type)); } else { handlers_[type] = NULL; } } int ObCheckpointExecutor::init(ObLS *ls, ObILogHandler *loghandler) { int ret = OB_SUCCESS; ls_ = ls; loghandler_ = loghandler; return ret; } void ObCheckpointExecutor::start() { online(); } void ObCheckpointExecutor::online() { WLockGuard guard(rwlock_); update_checkpoint_enabled_ = true; } void ObCheckpointExecutor::offline() { WLockGuard guard(rwlock_); update_checkpoint_enabled_ = false; } void ObCheckpointExecutor::get_min_rec_scn(int &log_type, SCN &min_rec_scn) const { for (int i = 1; i < ObLogBaseType::MAX_LOG_BASE_TYPE; i++) { if (OB_NOT_NULL(handlers_[i])) { SCN rec_scn = handlers_[i]->get_rec_scn(); if (rec_scn > SCN::min_scn() && rec_scn < min_rec_scn) { min_rec_scn = rec_scn; log_type = i; } } } } inline void get_min_rec_scn_service_type_by_index_(int index, char* service_type) { int ret = OB_SUCCESS; if (index == 0) { strncpy(service_type ,"MAX_DECIDED_SCN", common::MAX_SERVICE_TYPE_BUF_LENGTH); } else if (OB_FAIL(log_base_type_to_string(ObLogBaseType(index), service_type, common::MAX_SERVICE_TYPE_BUF_LENGTH))) { STORAGE_LOG(WARN, "log_base_type_to_string failed", K(ret), K(index)); strncpy(service_type ,"UNKNOWN_SERVICE_TYPE", common::MAX_SERVICE_TYPE_BUF_LENGTH); } } int ObCheckpointExecutor::update_clog_checkpoint() { int ret = OB_SUCCESS; WLockGuard guard_for_update_clog_checkpoint(rwlock_for_update_clog_checkpoint_); RLockGuard guard(rwlock_); if (update_checkpoint_enabled_) { ObFreezer *freezer = ls_->get_freezer(); if (OB_NOT_NULL(freezer)) { SCN checkpoint_scn; checkpoint_scn.set_max(); if (OB_FAIL(freezer->get_max_consequent_callbacked_scn(checkpoint_scn))) { STORAGE_LOG(WARN, "get_max_consequent_callbacked_scn failed", K(ret), K(freezer->get_ls_id())); } else { // used to record which handler provide the smallest rec_scn int min_rec_scn_service_type_index = 0; char service_type[common::MAX_SERVICE_TYPE_BUF_LENGTH]; get_min_rec_scn(min_rec_scn_service_type_index, checkpoint_scn); get_min_rec_scn_service_type_by_index_(min_rec_scn_service_type_index, service_type); const SCN checkpoint_scn_in_ls_meta = ls_->get_clog_checkpoint_scn(); const share::ObLSID ls_id = ls_->get_ls_id(); LSN clog_checkpoint_lsn; if (checkpoint_scn == checkpoint_scn_in_ls_meta) { STORAGE_LOG(INFO, "[CHECKPOINT] clog checkpoint no change", K(checkpoint_scn), K(checkpoint_scn_in_ls_meta), K(ls_id), K(service_type)); } else if (checkpoint_scn < checkpoint_scn_in_ls_meta) { if (min_rec_scn_service_type_index == 0) { STORAGE_LOG(INFO, "[CHECKPOINT] expexted when no log callbacked or replayed", K(checkpoint_scn), K(checkpoint_scn_in_ls_meta), K(ls_id)); } else { STORAGE_LOG(ERROR, "[CHECKPOINT] can not advance clog checkpoint", K(checkpoint_scn), K(checkpoint_scn_in_ls_meta), K(ls_id), K(service_type)); } } else if (OB_FAIL(loghandler_->locate_by_scn_coarsely(checkpoint_scn, clog_checkpoint_lsn))) { if (OB_ENTRY_NOT_EXIST == ret) { STORAGE_LOG(WARN, "no file in disk", K(ret), K(ls_id), K(checkpoint_scn)); ret = OB_SUCCESS; } else if (OB_NOT_INIT == ret) { STORAGE_LOG(WARN, "palf has been disabled", K(ret), K(checkpoint_scn), K(ls_->get_ls_id())); ret = OB_SUCCESS; } else if (OB_NEED_RETRY == ret) { STORAGE_LOG(WARN, "locate_by_scn_coarsely need retry", K(checkpoint_scn), K(ls_->get_ls_id())); ret = OB_SUCCESS; } else { STORAGE_LOG(ERROR, "locate lsn by logts failed", K(ret), K(ls_id), K(checkpoint_scn), K(checkpoint_scn_in_ls_meta)); } } else if (OB_FAIL(ls_->set_clog_checkpoint(clog_checkpoint_lsn, checkpoint_scn))) { STORAGE_LOG(WARN, "set clog checkpoint failed", K(ret), K(clog_checkpoint_lsn), K(checkpoint_scn), K(ls_id)); } else { FLOG_INFO("[CHECKPOINT] update clog checkpoint successfully", K(clog_checkpoint_lsn), K(checkpoint_scn), K(ls_id), K(service_type)); } } } else { STORAGE_LOG(WARN, "freezer should not null", K(ls_->get_ls_id())); } } else { STORAGE_LOG(WARN, "update_checkpoint is not enabled", K(ls_->get_ls_id())); } return ret; } int ObCheckpointExecutor::advance_checkpoint_by_flush(SCN recycle_scn) { int ret = OB_SUCCESS; const ObLSID ls_id = ls_->get_ls_id(); const LSN clog_checkpoint_lsn = ls_->get_clog_base_lsn(); const SCN clog_checkpoint_scn = ls_->get_clog_checkpoint_scn(); RLockGuard guard(rwlock_); if (update_checkpoint_enabled_) { // calculate recycle_scn if it is invalid(called by clog disk full situation) if (!recycle_scn.is_valid() && OB_FAIL(calculate_recycle_scn_(clog_checkpoint_lsn, clog_checkpoint_scn, recycle_scn))) { STORAGE_LOG(WARN, "calculate recycle scn failed", KR(ret)); } if (OB_FAIL(ret)) { } else if (OB_FAIL(check_need_flush_(clog_checkpoint_scn, recycle_scn))) { STORAGE_LOG(WARN, "no need flush"); } else { STORAGE_LOG(INFO, "start flush", K(recycle_scn), K(clog_checkpoint_scn), K(ls_id)); for (int i = 1; i < ObLogBaseType::MAX_LOG_BASE_TYPE; i++) { int tmp_ret = OB_SUCCESS; if (OB_NOT_NULL(handlers_[i]) && OB_TMP_FAIL(handlers_[i]->flush(recycle_scn))) { STORAGE_LOG(WARN, "handler flush failed", KR(tmp_ret), K(recycle_scn), K(tmp_ret), K(i), K(ls_id)); } } } } else { STORAGE_LOG(WARN, "update_checkpoint is not enabled", K(ls_id)); } return ret; } int ObCheckpointExecutor::calculate_recycle_scn_(const LSN clog_checkpoint_lsn, const SCN clog_checkpoint_scn, SCN &recycle_scn) { int ret = OB_SUCCESS; LSN end_lsn; // locate_by_lsn_coarsely may return a recycle_scn less than checkpoint_scn // so if prev_recycle_scn_ <= clog_checkpoint_scn, the recycle_scn is still needed to be calculated again if (prev_clog_checkpoint_lsn_.is_valid() && (prev_clog_checkpoint_lsn_ == clog_checkpoint_lsn) && prev_recycle_scn_.is_valid() && (prev_recycle_scn_ > clog_checkpoint_scn)) { recycle_scn = prev_recycle_scn_; reuse_recycle_scn_times_++; if (reuse_recycle_scn_times_ % 1000 == 0) { STORAGE_LOG_RET(WARN, 0, "attention! clog checkpiont has not changed for a long time"); recycle_scn.set_max(); } STORAGE_LOG(INFO, "clog checkpoint has not changed yet. use previous recycle_scn to advance checkpoint", K(reuse_recycle_scn_times_), K(clog_checkpoint_lsn), K(recycle_scn)); } else if (OB_FAIL(loghandler_->get_end_lsn(end_lsn))) { STORAGE_LOG(WARN, "get end lsn failed", K(ret), K(ls_->get_ls_id())); } else { LSN calcu_recycle_lsn = clog_checkpoint_lsn + ((end_lsn - clog_checkpoint_lsn) * CLOG_GC_PERCENT / 100); if (OB_FAIL(loghandler_->locate_by_lsn_coarsely(calcu_recycle_lsn, recycle_scn))) { STORAGE_LOG(WARN, "locate_by_lsn_coarsely failed", K(calcu_recycle_lsn), K(recycle_scn), K(ls_->get_ls_id())); } else { prev_clog_checkpoint_lsn_ = clog_checkpoint_lsn; prev_recycle_scn_ = recycle_scn; reuse_recycle_scn_times_ = 0; STORAGE_LOG(INFO, "advance checkpoint by flush to avoid clog disk full", K(recycle_scn), K(end_lsn), K(clog_checkpoint_lsn), K(calcu_recycle_lsn), K(ls_->get_ls_id())); } } return ret; } int ObCheckpointExecutor::check_need_flush_(const SCN clog_checkpoint_scn, const SCN recycle_scn) { int ret = OB_SUCCESS; SCN max_decided_scn; const ObLSID ls_id = ls_->get_ls_id(); if (recycle_scn.is_max()) { // must do flush } else if (recycle_scn < clog_checkpoint_scn) { ret = OB_NO_NEED_UPDATE; STORAGE_LOG(WARN, "recycle_scn should not smaller than checkpoint_log_scn", K(recycle_scn), K(clog_checkpoint_scn), K(ls_id)); } else if (OB_FAIL(loghandler_->get_max_decided_scn(max_decided_scn))) { STORAGE_LOG(WARN, "failed to get_max_decided_scn", K(recycle_scn), K(clog_checkpoint_scn), K(ls_id)); } else if (recycle_scn > max_decided_scn) { ret = OB_EAGAIN; STORAGE_LOG(WARN, "recycle_scn is larger than max_decided_scn", K(recycle_scn), K(clog_checkpoint_scn), K(ls_id), K(max_decided_scn)); } return ret; } int ObCheckpointExecutor::get_checkpoint_info(ObIArray &checkpoint_array) { int ret = OB_SUCCESS; checkpoint_array.reset(); for (int i = 1; i < ObLogBaseType::MAX_LOG_BASE_TYPE; i++) { if (OB_NOT_NULL(handlers_[i])) { ObCheckpointVTInfo info; info.rec_scn = handlers_[i]->get_rec_scn(); info.service_type = i; checkpoint_array.push_back(info); } } return ret; } int64_t ObCheckpointExecutor::get_cannot_recycle_log_size() { int ret = OB_SUCCESS; int64_t cannot_recycle_log_size = 0; LSN end_lsn; if (OB_FAIL(loghandler_->get_end_lsn(end_lsn))) { STORAGE_LOG(WARN, "get end lsn failed", K(ret), K(ls_->get_ls_id())); } else { cannot_recycle_log_size = end_lsn.val_ - ls_->get_clog_base_lsn().val_; } return cannot_recycle_log_size; } int ObCheckpointExecutor::diagnose(CheckpointDiagnoseInfo &diagnose_info) const { int ret = OB_SUCCESS; RLockGuard guard(rwlock_); int log_type_index = 0; diagnose_info.checkpoint_ = ls_->get_clog_checkpoint_scn(); diagnose_info.min_rec_scn_.set_max(); get_min_rec_scn(log_type_index, diagnose_info.min_rec_scn_); ObLogBaseType log_type = static_cast(log_type_index); diagnose_info.log_type_ = log_type; return ret; } int ObCheckpointExecutor::traversal_flush() const { int ret = OB_SUCCESS; ObLSTxService *ls_tx_ser = nullptr; if (!update_checkpoint_enabled_) { STORAGE_LOG(WARN, "update_checkpoint is not enabled", K(ls_->get_ls_id())); } else if (OB_ISNULL(ls_tx_ser = ls_->get_tx_svr())) { ret = OB_ERR_UNEXPECTED; STORAGE_LOG(WARN, "ls_tx_ser should not be null", K(ret), K(ls_->get_ls_id())); } else if (OB_FAIL(ls_tx_ser->traversal_flush())) { STORAGE_LOG(WARN, "ls_tx_ser flush failed", K(ret), K(ls_->get_ls_id())); } return ret; } } // namespace checkpoint } // namespace storage } // namespace oceanbase