Files
oceanbase/src/storage/checkpoint/ob_checkpoint_executor.cpp
2024-02-28 10:44:42 +00:00

370 lines
13 KiB
C++

/**
* Copyright (c) 2021 OceanBase
* OceanBase CE is licensed under Mulan PubL v2.
* You can use this software according to the terms and conditions of the Mulan PubL v2.
* You may obtain a copy of Mulan PubL v2 at:
* http://license.coscl.org.cn/MulanPubL-2.0
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
* See the Mulan PubL v2 for more details.
*/
#define USING_LOG_PREFIX STORAGE
#include "storage/ls/ob_ls.h"
#include "storage/checkpoint/ob_checkpoint_executor.h"
#include "storage/tx_storage/ob_checkpoint_service.h"
#include "storage/checkpoint/ob_data_checkpoint.h"
#include "share/ob_force_print_log.h"
#include "logservice/ob_log_base_type.h"
namespace oceanbase
{
using namespace share;
using namespace logservice;
namespace storage
{
namespace checkpoint
{
ObCheckpointExecutor::ObCheckpointExecutor()
: rwlock_(common::ObLatchIds::CLOG_CKPT_RWLOCK),
update_checkpoint_enabled_(false),
reuse_recycle_scn_times_(0),
prev_clog_checkpoint_lsn_(),
prev_recycle_scn_()
{
reset();
}
ObCheckpointExecutor::~ObCheckpointExecutor()
{
reset();
}
void ObCheckpointExecutor::reset()
{
for (int i = 0; i < ObLogBaseType::MAX_LOG_BASE_TYPE; i++) {
handlers_[i] = NULL;
}
ls_ = NULL;
loghandler_ = NULL;
reuse_recycle_scn_times_ = 0;
prev_clog_checkpoint_lsn_.reset();
prev_recycle_scn_.set_invalid();
}
int ObCheckpointExecutor::register_handler(const ObLogBaseType &type,
ObICheckpointSubHandler *handler)
{
int ret = OB_SUCCESS;
if (!is_valid_log_base_type(type) || NULL == handler) {
ret = OB_INVALID_ARGUMENT;
STORAGE_LOG(WARN, "invalid arguments", K(ret), K(type), K(handler));
} else {
if (OB_NOT_NULL(handlers_[type])) {
STORAGE_LOG(WARN, "repeat register into checkpoint_executor", K(ret), K(type), K(handler));
} else {
handlers_[type] = handler;
}
}
return ret;
}
void ObCheckpointExecutor::unregister_handler(const ObLogBaseType &type)
{
int ret = OB_SUCCESS;
if (!is_valid_log_base_type(type)) {
ret = OB_INVALID_ARGUMENT;
STORAGE_LOG(WARN, "invalid arguments", K(ret), K(type));
} else {
handlers_[type] = NULL;
}
}
int ObCheckpointExecutor::init(ObLS *ls, ObILogHandler *loghandler)
{
int ret = OB_SUCCESS;
ls_ = ls;
loghandler_ = loghandler;
return ret;
}
void ObCheckpointExecutor::start()
{
online();
}
void ObCheckpointExecutor::online()
{
WLockGuard guard(rwlock_);
update_checkpoint_enabled_ = true;
}
void ObCheckpointExecutor::offline()
{
WLockGuard guard(rwlock_);
update_checkpoint_enabled_ = false;
}
void ObCheckpointExecutor::get_min_rec_scn(int &log_type, SCN &min_rec_scn) const
{
for (int i = 1; i < ObLogBaseType::MAX_LOG_BASE_TYPE; i++) {
if (OB_NOT_NULL(handlers_[i])) {
SCN rec_scn = handlers_[i]->get_rec_scn();
if (rec_scn > SCN::min_scn() && rec_scn < min_rec_scn) {
min_rec_scn = rec_scn;
log_type = i;
}
}
}
}
inline void get_min_rec_scn_service_type_by_index_(int index, char* service_type)
{
int ret = OB_SUCCESS;
if (index == 0) {
strncpy(service_type ,"MAX_DECIDED_SCN", common::MAX_SERVICE_TYPE_BUF_LENGTH);
} else if (OB_FAIL(log_base_type_to_string(ObLogBaseType(index),
service_type,
common::MAX_SERVICE_TYPE_BUF_LENGTH))) {
STORAGE_LOG(WARN, "log_base_type_to_string failed", K(ret), K(index));
strncpy(service_type ,"UNKNOWN_SERVICE_TYPE", common::MAX_SERVICE_TYPE_BUF_LENGTH);
}
}
int ObCheckpointExecutor::update_clog_checkpoint()
{
int ret = OB_SUCCESS;
WLockGuard guard_for_update_clog_checkpoint(rwlock_for_update_clog_checkpoint_);
RLockGuard guard(rwlock_);
if (update_checkpoint_enabled_) {
ObFreezer *freezer = ls_->get_freezer();
if (OB_NOT_NULL(freezer)) {
SCN checkpoint_scn;
checkpoint_scn.set_max();
if (OB_FAIL(freezer->get_max_consequent_callbacked_scn(checkpoint_scn))) {
STORAGE_LOG(WARN, "get_max_consequent_callbacked_scn failed", K(ret), K(freezer->get_ls_id()));
} else {
// used to record which handler provide the smallest rec_scn
int min_rec_scn_service_type_index = 0;
char service_type[common::MAX_SERVICE_TYPE_BUF_LENGTH];
get_min_rec_scn(min_rec_scn_service_type_index, checkpoint_scn);
get_min_rec_scn_service_type_by_index_(min_rec_scn_service_type_index, service_type);
const SCN checkpoint_scn_in_ls_meta = ls_->get_clog_checkpoint_scn();
const share::ObLSID ls_id = ls_->get_ls_id();
LSN clog_checkpoint_lsn;
if (checkpoint_scn == checkpoint_scn_in_ls_meta) {
STORAGE_LOG(INFO, "[CHECKPOINT] clog checkpoint no change", K(checkpoint_scn),
K(checkpoint_scn_in_ls_meta), K(ls_id), K(service_type));
} else if (checkpoint_scn < checkpoint_scn_in_ls_meta) {
if (min_rec_scn_service_type_index == 0) {
STORAGE_LOG(INFO, "[CHECKPOINT] expexted when no log callbacked or replayed",
K(checkpoint_scn), K(checkpoint_scn_in_ls_meta), K(ls_id));
} else {
STORAGE_LOG(ERROR, "[CHECKPOINT] can not advance clog checkpoint", K(checkpoint_scn),
K(checkpoint_scn_in_ls_meta), K(ls_id), K(service_type));
}
} else if (OB_FAIL(loghandler_->locate_by_scn_coarsely(checkpoint_scn, clog_checkpoint_lsn))) {
if (OB_ENTRY_NOT_EXIST == ret) {
STORAGE_LOG(WARN, "no file in disk", K(ret), K(ls_id), K(checkpoint_scn));
ret = OB_SUCCESS;
} else if (OB_NOT_INIT == ret) {
STORAGE_LOG(WARN, "palf has been disabled", K(ret), K(checkpoint_scn), K(ls_->get_ls_id()));
ret = OB_SUCCESS;
} else if (OB_NEED_RETRY == ret) {
STORAGE_LOG(WARN, "locate_by_scn_coarsely need retry", K(checkpoint_scn), K(ls_->get_ls_id()));
ret = OB_SUCCESS;
} else {
STORAGE_LOG(ERROR, "locate lsn by logts failed", K(ret), K(ls_id),
K(checkpoint_scn), K(checkpoint_scn_in_ls_meta));
}
} else if (OB_FAIL(ls_->set_clog_checkpoint(clog_checkpoint_lsn, checkpoint_scn))) {
STORAGE_LOG(WARN, "set clog checkpoint failed", K(ret), K(clog_checkpoint_lsn), K(checkpoint_scn), K(ls_id));
} else {
FLOG_INFO("[CHECKPOINT] update clog checkpoint successfully",
K(clog_checkpoint_lsn), K(checkpoint_scn), K(ls_id),
K(service_type));
}
}
} else {
STORAGE_LOG(WARN, "freezer should not null", K(ls_->get_ls_id()));
}
} else {
STORAGE_LOG(WARN, "update_checkpoint is not enabled", K(ls_->get_ls_id()));
}
return ret;
}
int ObCheckpointExecutor::advance_checkpoint_by_flush(SCN recycle_scn)
{
int ret = OB_SUCCESS;
const ObLSID ls_id = ls_->get_ls_id();
const LSN clog_checkpoint_lsn = ls_->get_clog_base_lsn();
const SCN clog_checkpoint_scn = ls_->get_clog_checkpoint_scn();
RLockGuard guard(rwlock_);
if (update_checkpoint_enabled_) {
// calculate recycle_scn if it is invalid(called by clog disk full situation)
if (!recycle_scn.is_valid() &&
OB_FAIL(calculate_recycle_scn_(clog_checkpoint_lsn, clog_checkpoint_scn, recycle_scn))) {
STORAGE_LOG(WARN, "calculate recycle scn failed", KR(ret));
}
if (OB_FAIL(ret)) {
} else if (OB_FAIL(check_need_flush_(clog_checkpoint_scn, recycle_scn))) {
STORAGE_LOG(WARN, "no need flush");
} else {
STORAGE_LOG(INFO, "start flush", K(recycle_scn), K(clog_checkpoint_scn), K(ls_id));
for (int i = 1; i < ObLogBaseType::MAX_LOG_BASE_TYPE; i++) {
int tmp_ret = OB_SUCCESS;
if (OB_NOT_NULL(handlers_[i]) && OB_TMP_FAIL(handlers_[i]->flush(recycle_scn))) {
STORAGE_LOG(WARN, "handler flush failed", KR(tmp_ret), K(recycle_scn), K(tmp_ret), K(i), K(ls_id));
}
}
}
} else {
STORAGE_LOG(WARN, "update_checkpoint is not enabled", K(ls_id));
}
return ret;
}
int ObCheckpointExecutor::calculate_recycle_scn_(const LSN clog_checkpoint_lsn,
const SCN clog_checkpoint_scn,
SCN &recycle_scn)
{
int ret = OB_SUCCESS;
LSN end_lsn;
// locate_by_lsn_coarsely may return a recycle_scn less than checkpoint_scn
// so if prev_recycle_scn_ <= clog_checkpoint_scn, the recycle_scn is still needed to be calculated again
if (prev_clog_checkpoint_lsn_.is_valid() && (prev_clog_checkpoint_lsn_ == clog_checkpoint_lsn) &&
prev_recycle_scn_.is_valid() && (prev_recycle_scn_ > clog_checkpoint_scn)) {
recycle_scn = prev_recycle_scn_;
reuse_recycle_scn_times_++;
if (reuse_recycle_scn_times_ % 1000 == 0) {
STORAGE_LOG_RET(WARN, 0, "attention! clog checkpiont has not changed for a long time");
recycle_scn.set_max();
}
STORAGE_LOG(INFO,
"clog checkpoint has not changed yet. use previous recycle_scn to advance checkpoint",
K(reuse_recycle_scn_times_),
K(clog_checkpoint_lsn),
K(recycle_scn));
} else if (OB_FAIL(loghandler_->get_end_lsn(end_lsn))) {
STORAGE_LOG(WARN, "get end lsn failed", K(ret), K(ls_->get_ls_id()));
} else {
LSN calcu_recycle_lsn = clog_checkpoint_lsn + ((end_lsn - clog_checkpoint_lsn) * CLOG_GC_PERCENT / 100);
if (OB_FAIL(loghandler_->locate_by_lsn_coarsely(calcu_recycle_lsn, recycle_scn))) {
STORAGE_LOG(WARN, "locate_by_lsn_coarsely failed", K(calcu_recycle_lsn), K(recycle_scn), K(ls_->get_ls_id()));
} else {
prev_clog_checkpoint_lsn_ = clog_checkpoint_lsn;
prev_recycle_scn_ = recycle_scn;
reuse_recycle_scn_times_ = 0;
STORAGE_LOG(INFO,
"advance checkpoint by flush to avoid clog disk full",
K(recycle_scn),
K(end_lsn),
K(clog_checkpoint_lsn),
K(calcu_recycle_lsn),
K(ls_->get_ls_id()));
}
}
return ret;
}
int ObCheckpointExecutor::check_need_flush_(const SCN clog_checkpoint_scn, const SCN recycle_scn)
{
int ret = OB_SUCCESS;
SCN max_decided_scn;
const ObLSID ls_id = ls_->get_ls_id();
if (recycle_scn.is_max()) {
// must do flush
} else if (recycle_scn < clog_checkpoint_scn) {
ret = OB_NO_NEED_UPDATE;
STORAGE_LOG(WARN,
"recycle_scn should not smaller than checkpoint_log_scn",
K(recycle_scn),
K(clog_checkpoint_scn),
K(ls_id));
} else if (OB_FAIL(loghandler_->get_max_decided_scn(max_decided_scn))) {
STORAGE_LOG(WARN, "failed to get_max_decided_scn", K(recycle_scn), K(clog_checkpoint_scn), K(ls_id));
} else if (recycle_scn > max_decided_scn) {
ret = OB_EAGAIN;
STORAGE_LOG(WARN,
"recycle_scn is larger than max_decided_scn",
K(recycle_scn),
K(clog_checkpoint_scn),
K(ls_id),
K(max_decided_scn));
}
return ret;
}
int ObCheckpointExecutor::get_checkpoint_info(ObIArray<ObCheckpointVTInfo> &checkpoint_array)
{
int ret = OB_SUCCESS;
checkpoint_array.reset();
for (int i = 1; i < ObLogBaseType::MAX_LOG_BASE_TYPE; i++) {
if (OB_NOT_NULL(handlers_[i])) {
ObCheckpointVTInfo info;
info.rec_scn = handlers_[i]->get_rec_scn();
info.service_type = i;
checkpoint_array.push_back(info);
}
}
return ret;
}
int64_t ObCheckpointExecutor::get_cannot_recycle_log_size()
{
int ret = OB_SUCCESS;
int64_t cannot_recycle_log_size = 0;
LSN end_lsn;
if (OB_FAIL(loghandler_->get_end_lsn(end_lsn))) {
STORAGE_LOG(WARN, "get end lsn failed", K(ret), K(ls_->get_ls_id()));
} else {
cannot_recycle_log_size = end_lsn.val_ - ls_->get_clog_base_lsn().val_;
}
return cannot_recycle_log_size;
}
int ObCheckpointExecutor::diagnose(CheckpointDiagnoseInfo &diagnose_info) const
{
int ret = OB_SUCCESS;
RLockGuard guard(rwlock_);
int log_type_index = 0;
diagnose_info.checkpoint_ = ls_->get_clog_checkpoint_scn();
diagnose_info.min_rec_scn_.set_max();
get_min_rec_scn(log_type_index, diagnose_info.min_rec_scn_);
ObLogBaseType log_type = static_cast<ObLogBaseType>(log_type_index);
diagnose_info.log_type_ = log_type;
return ret;
}
int ObCheckpointExecutor::traversal_flush() const
{
int ret = OB_SUCCESS;
ObLSTxService *ls_tx_ser = nullptr;
if (!update_checkpoint_enabled_) {
STORAGE_LOG(WARN, "update_checkpoint is not enabled", K(ls_->get_ls_id()));
} else if (OB_ISNULL(ls_tx_ser = ls_->get_tx_svr())) {
ret = OB_ERR_UNEXPECTED;
STORAGE_LOG(WARN, "ls_tx_ser should not be null", K(ret), K(ls_->get_ls_id()));
} else if (OB_FAIL(ls_tx_ser->traversal_flush())) {
STORAGE_LOG(WARN, "ls_tx_ser flush failed", K(ret), K(ls_->get_ls_id()));
}
return ret;
}
} // namespace checkpoint
} // namespace storage
} // namespace oceanbase