Files
oceanbase/src/storage/ls/ob_ls_tablet_service.cpp
2023-11-01 08:13:07 +00:00

6437 lines
264 KiB
C++
Executable File

/**
* Copyright (c) 2021 OceanBase
* OceanBase CE is licensed under Mulan PubL v2.
* You can use this software according to the terms and conditions of the Mulan PubL v2.
* You may obtain a copy of Mulan PubL v2 at:
* http://license.coscl.org.cn/MulanPubL-2.0
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
* See the Mulan PubL v2 for more details.
*/
#define USING_LOG_PREFIX STORAGE
#include "storage/ls/ob_ls_tablet_service.h"
#include "common/row/ob_row_store.h"
#include "lib/objectpool/ob_server_object_pool.h"
#include "lib/utility/ob_macro_utils.h"
#include "lib/utility/utility.h"
#include "logservice/ob_log_base_header.h"
#include "logservice/ob_log_base_type.h"
#include "logservice/ob_log_service.h"
#include "share/scn.h"
#include "observer/report/ob_i_meta_report.h"
#include "share/ob_disk_usage_table_operator.h"
#include "share/rc/ob_tenant_base.h"
#include "share/schema/ob_table_param.h"
#include "share/schema/ob_table_dml_param.h"
#include "share/schema/ob_tenant_schema_service.h"
#include "share/ob_ddl_common.h"
#include "storage/blocksstable/index_block/ob_index_block_builder.h"
#include "storage/blocksstable/ob_sstable_meta.h"
#include "storage/ob_dml_running_ctx.h"
#include "storage/ob_partition_range_spliter.h"
#include "storage/ob_query_iterator_factory.h"
#include "storage/ob_relative_table.h"
#include "storage/ob_row_reshape.h"
#include "storage/ob_storage_struct.h"
#include "storage/ob_storage_table_guard.h"
#include "storage/ob_value_row_iterator.h"
#include "storage/access/ob_table_scan_iterator.h"
#include "storage/access/ob_table_scan_range.h"
#include "storage/access/ob_rows_info.h"
#include "storage/access/ob_table_scan_range.h"
#include "storage/access/ob_rows_info.h"
#include "storage/access/ob_table_estimator.h"
#include "storage/access/ob_index_sstable_estimator.h"
#include "storage/column_store/ob_column_oriented_sstable.h"
#include "storage/blocksstable/ob_sstable.h"
#include "storage/ls/ob_ls.h"
#include "storage/tablet/ob_tablet.h"
#include "storage/tablet/ob_tablet_iterator.h"
#include "storage/tablet/ob_tablet_binding_helper.h"
#include "storage/tablet/ob_tablet_create_delete_helper.h"
#include "storage/tablet/ob_tablet_create_sstable_param.h"
#include "storage/tablet/ob_tablet_persister.h"
#include "storage/tablet/ob_tablet_service_clog_replay_executor.h"
#include "storage/tablet/ob_tablet_status.h"
#include "storage/tablet/ob_tablet_slog_helper.h"
#include "storage/tablet/ob_tablet_persister.h"
#include "storage/tx/ob_trans_define.h"
#include "storage/tx/ob_trans_part_ctx.h"
#include "storage/tx_storage/ob_ls_service.h"
#include "storage/meta_mem/ob_tablet_map_key.h"
#include "storage/meta_mem/ob_tenant_meta_mem_mgr.h"
#include "storage/slog/ob_storage_log_replayer.h"
#include "storage/slog/ob_storage_log_struct.h"
#include "storage/slog/ob_storage_logger.h"
#include "share/ob_lob_access_utils.h"
#include "observer/table_load/ob_table_load_table_ctx.h"
#include "observer/table_load/ob_table_load_coordinator.h"
#include "observer/table_load/ob_table_load_service.h"
#include "observer/table_load/ob_table_load_store.h"
#include "observer/ob_server_event_history_table_operator.h"
#include "storage/high_availability/ob_storage_ha_utils.h"
using namespace oceanbase::share;
using namespace oceanbase::common;
using namespace oceanbase::transaction;
using namespace oceanbase::blocksstable;
using namespace oceanbase::observer;
namespace oceanbase
{
namespace storage
{
using namespace mds;
ObLSTabletService::ObLSTabletService()
: ls_(nullptr),
tx_data_memtable_mgr_(),
tx_ctx_memtable_mgr_(),
lock_memtable_mgr_(),
mds_table_mgr_(),
tablet_id_set_(),
bucket_lock_(),
allow_to_read_mgr_(),
is_inited_(false),
is_stopped_(false)
{
}
ObLSTabletService::~ObLSTabletService()
{
}
int ObLSTabletService::init(
ObLS *ls)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(is_inited_)) {
ret = OB_INIT_TWICE;
LOG_WARN("init twice", K(ret), K_(is_inited));
} else if (OB_ISNULL(ls)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(ls));
} else if (OB_FAIL(tablet_id_set_.init(ObTabletCommon::BUCKET_LOCK_BUCKET_CNT, MTL_ID()))) {
LOG_WARN("fail to init tablet id set", K(ret));
} else if (OB_FAIL(bucket_lock_.init(ObTabletCommon::BUCKET_LOCK_BUCKET_CNT,
ObLatchIds::TABLET_BUCKET_LOCK, "TabletSvrBucket", MTL_ID()))) {
LOG_WARN("failed to init bucket lock", K(ret));
} else if (OB_FAIL(set_allow_to_read_(ls))) {
LOG_WARN("failed to set allow to read", K(ret));
} else if (OB_FAIL(mds_table_mgr_.init(ls))) {
LOG_WARN("fail to init mds table mgr", KR(ret));
} else {
ls_ = ls;
is_stopped_ = false;
is_inited_ = true;
}
if (OB_UNLIKELY(!is_inited_)) {
destroy();
}
return ret;
}
void ObLSTabletService::destroy()
{
delete_all_tablets();
tablet_id_set_.destroy();
tx_data_memtable_mgr_.destroy();
tx_ctx_memtable_mgr_.destroy();
lock_memtable_mgr_.destroy();
mds_table_mgr_.destroy();
bucket_lock_.destroy();
ls_= nullptr;
is_stopped_ = false;
is_inited_ = false;
}
int ObLSTabletService::stop()
{
int ret = OB_SUCCESS;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else {
is_stopped_ = true;
}
return ret;
}
int ObLSTabletService::offline()
{
int ret = OB_SUCCESS;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_FAIL(offline_build_tablet_without_memtable_())) {
LOG_WARN("failed to offline build tablet without memtable", K(ret));
} else if (OB_FAIL(offline_destroy_memtable_and_mds_table_())) {
LOG_WARN("failed to offline destroy memtable and mds table", K(ret));
} else {
mds_table_mgr_.offline();
}
return ret;
}
int ObLSTabletService::online()
{
return OB_SUCCESS;
}
int ObLSTabletService::replay(
const void *buffer,
const int64_t nbytes,
const palf::LSN &lsn,
const SCN &scn)
{
int ret = OB_SUCCESS;
int64_t pos = 0;
logservice::ObLogBaseHeader base_header;
common::ObTabletID tablet_id;
const char *log_buf = static_cast<const char *>(buffer);
ObTabletServiceClogReplayExecutor replayer_executor;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_FAIL(base_header.deserialize(log_buf, nbytes, pos))) {
LOG_WARN("log base header deserialize error", K(ret));
} else if (logservice::ObLogBaseType::STORAGE_SCHEMA_LOG_BASE_TYPE != base_header.get_log_type()) {
ret = OB_NOT_SUPPORTED;
LOG_WARN("log type not supported", K(ret), "log_type", base_header.get_log_type());
} else if (OB_FAIL(tablet_id.deserialize(log_buf, nbytes, pos))) {
LOG_WARN("fail to deserialize tablet id", K(ret), KP(log_buf), K(nbytes), K(pos));
} else if (OB_FAIL(replayer_executor.init(log_buf, nbytes, pos, scn))) {
LOG_WARN("failed to init replayer", K(ret), KP(log_buf), K(nbytes), K(pos), K(lsn), K(scn));
} else if (OB_FAIL(replayer_executor.execute(scn, ls_->get_ls_id(), tablet_id))) {
if (OB_TABLET_NOT_EXIST == ret) {
ret = OB_SUCCESS; // TODO (bowen.gbw): unify multi data replay logic
LOG_INFO("tablet does not exist, skip", K(ret), K(replayer_executor));
} else if (OB_TIMEOUT == ret) {
LOG_INFO("replace timeout errno", KR(ret), K(replayer_executor));
ret = OB_EAGAIN;
} else {
LOG_WARN("failed to replay", K(ret), K(replayer_executor));
}
}
return ret;
}
void ObLSTabletService::switch_to_follower_forcedly()
{
// TODO
}
int ObLSTabletService::switch_to_leader()
{
int ret = OB_SUCCESS;
//TODO
return ret;
}
int ObLSTabletService::switch_to_follower_gracefully()
{
int ret = OB_SUCCESS;
//TODO
return ret;
}
int ObLSTabletService::resume_leader()
{
int ret = OB_SUCCESS;
//TODO
return ret;
}
int ObLSTabletService::flush(SCN &recycle_scn)
{
UNUSED(recycle_scn);
return OB_SUCCESS;
}
SCN ObLSTabletService::get_rec_scn()
{
return SCN::max_scn();
}
int ObLSTabletService::prepare_for_safe_destroy()
{
int ret = OB_SUCCESS;
if (OB_FAIL(delete_all_tablets())) {
LOG_WARN("fail to delete all tablets", K(ret));
}
#ifdef ERRSIM
if (!ls_->get_ls_id().is_sys_ls()) {
SERVER_EVENT_SYNC_ADD("ls_tablet_service", "after_delete_all_tablets",
"tenant_id", MTL_ID(),
"ls_id", ls_->get_ls_id().id());
DEBUG_SYNC(AFTER_LS_GC_DELETE_ALL_TABLETS);
}
#endif
return ret;
}
int ObLSTabletService::safe_to_destroy(bool &is_safe)
{
int ret = OB_SUCCESS;
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
is_safe = true;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else {
int64_t tx_data_memtable_mgr_ref = tx_data_memtable_mgr_.get_ref();
int64_t tx_ctx_memtable_mgr_ref = tx_ctx_memtable_mgr_.get_ref();
int64_t lock_memtable_mgr_ref = lock_memtable_mgr_.get_ref();
int64_t mds_table_mgr_ref = mds_table_mgr_.get_ref();
if (0 != tx_data_memtable_mgr_ref || 0 != tx_ctx_memtable_mgr_ref
|| 0 != lock_memtable_mgr_ref || 0 != mds_table_mgr_ref) {
if (REACH_TIME_INTERVAL(60L * 1000000)) { // 60s
LOG_WARN("inner tablet memtable mgr can't destroy", K(tx_data_memtable_mgr_ref),
K(tx_ctx_memtable_mgr_ref), K(lock_memtable_mgr_ref), K(mds_table_mgr_ref));
}
is_safe = false;
} else {
tx_data_memtable_mgr_.destroy();
tx_ctx_memtable_mgr_.destroy();
lock_memtable_mgr_.destroy();
mds_table_mgr_.destroy();
}
if (is_safe) {
bool is_wait_gc = false;
if (OB_FAIL(t3m->has_meta_wait_gc(is_wait_gc))) {
LOG_WARN("failed to check has_meta_wait_gc", K(ret));
is_safe = false;
} else {
is_safe = !is_wait_gc;
}
}
}
return ret;
}
int ObLSTabletService::delete_all_tablets()
{
int ret = OB_SUCCESS;
if (OB_NOT_NULL(ls_)) {
const ObLSID &ls_id = ls_->get_ls_id();
ObSArray<ObTabletID> tablet_id_array;
GetAllTabletIDOperator op(tablet_id_array);
ObTimeGuard time_guard("ObLSTabletService::delete_all_tablets", 1_s);
common::ObBucketWLockAllGuard lock_guard(bucket_lock_);
time_guard.click("Lock");
if (OB_FAIL(tablet_id_set_.foreach(op))) {
LOG_WARN("failed to traverse tablet id set", K(ret), K(ls_id));
} else if (tablet_id_array.empty()) {
// tablet id array is empty, do nothing
} else {
for (int64_t i = 0; OB_SUCC(ret) && i < tablet_id_array.count(); ++i) {
const ObTabletID &tablet_id = tablet_id_array.at(i);
if (OB_FAIL(inner_remove_tablet(ls_id, tablet_id))) {
LOG_ERROR("failed to do remove tablet", K(ret), K(ls_id), K(tablet_id));
ob_usleep(1000 * 1000);
ob_abort();
}
}
time_guard.click("RemoveTablet");
if (OB_SUCC(ret)) {
report_tablet_to_rs(tablet_id_array);
time_guard.click("ReportToRS");
}
}
}
return ret;
}
int ObLSTabletService::remove_tablet(const ObTabletHandle& tablet_handle)
{
int ret = OB_SUCCESS;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!tablet_handle.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid tablet", K(ret), K(tablet_handle));
} else {
const ObTablet &target_tablet = *(tablet_handle.get_obj());
const ObLSID ls_id = ls_->get_ls_id();
const ObTabletID tablet_id = target_tablet.get_tablet_meta().tablet_id_;
const ObTabletMapKey key(ls_id, tablet_id);
ObTabletHandle cur_tablet_handle;
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
if (OB_FAIL(ObTabletCreateDeleteHelper::get_tablet(key, cur_tablet_handle))) {
if (OB_TABLET_NOT_EXIST == ret) {
ret = OB_SUCCESS;
LOG_INFO("tablet does not exist, maybe already deleted", K(ret), K(key));
} else {
LOG_WARN("failed to get tablet", K(ret), K(key));
}
} else if (&target_tablet != cur_tablet_handle.get_obj()) {
ret = OB_EAGAIN;
LOG_INFO("tablet object has been changed, need retry", K(ret), K(key), K(target_tablet), KPC(cur_tablet_handle.get_obj()));
} else {
if (OB_FAIL(ObTabletSlogHelper::write_remove_tablet_slog(ls_id, tablet_id))) {
LOG_WARN("failed to write remove tablet slog", K(ret), K(ls_id), K(tablet_id));
} else if (OB_FAIL(tablet_handle.get_obj()->wait_release_memtables())) {
LOG_ERROR("failed to release memtables", K(ret), K(tablet_id));
} else if (OB_FAIL(inner_remove_tablet(ls_id, tablet_id))) {
LOG_ERROR("failed to do remove tablet", K(ret), K(ls_id), K(tablet_id));
ob_usleep(1000 * 1000);
ob_abort();
} else {
report_tablet_to_rs(tablet_id);
}
}
}
return ret;
}
int ObLSTabletService::remove_tablets(const common::ObIArray<common::ObTabletID> &tablet_id_array)
{
int ret = OB_SUCCESS;
const int64_t tablet_cnt = tablet_id_array.count();
ObSArray<uint64_t> all_tablet_id_hash_array;
ObSArray<ObTabletID> tablet_ids;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(0 == tablet_cnt)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args, tablet id array is empty", K(ret), K(tablet_id_array));
} else if (OB_FAIL(all_tablet_id_hash_array.reserve(tablet_cnt))) {
LOG_WARN("failed to reserve memory for array", K(ret), K(tablet_cnt));
} else if (OB_FAIL(tablet_ids.reserve(tablet_cnt))) {
LOG_WARN("failed to reserve memory for array", K(ret), K(tablet_cnt));
} else {
for (int64_t i = 0; OB_SUCC(ret) && i < tablet_cnt; ++i) {
const ObTabletID &tablet_id = tablet_id_array.at(i);
if (OB_FAIL(all_tablet_id_hash_array.push_back(tablet_id.hash()))) {
LOG_WARN("failed to push back tablet id hash value", K(ret), K(tablet_id));
}
}
}
if (OB_SUCC(ret)) {
ObMetaDiskAddr tablet_addr;
ObTimeGuard time_guard("ObLSTabletService::remove_tablets", 1_s);
ObMultiBucketLockGuard lock_guard(bucket_lock_, true/*is_write_lock*/);
if (OB_FAIL(lock_guard.lock_multi_buckets(all_tablet_id_hash_array))) {
LOG_WARN("failed to lock multi buckets", K(ret));
} else {
time_guard.click("Lock");
const share::ObLSID &ls_id = ls_->get_ls_id();
ObTabletHandle tablet_handle;
ObTabletMapKey key;
key.ls_id_ = ls_id;
// check tablet existence
for (int64_t i = 0; OB_SUCC(ret) && i < tablet_cnt; ++i) {
const ObTabletID &tablet_id = tablet_id_array.at(i);
key.tablet_id_ = tablet_id;
tablet_addr.reset();
if (OB_FAIL(ObTabletCreateDeleteHelper::get_tablet(key, tablet_handle))) {
if (OB_TABLET_NOT_EXIST == ret) {
ret = OB_SUCCESS;
LOG_INFO("tablet does not exist, maybe already deleted", K(ret), K(key));
} else {
LOG_WARN("failed to get tablet", K(ret), K(key));
}
} else if (OB_FAIL(tablet_handle.get_obj()->wait_release_memtables())) {
LOG_ERROR("failed to release memtables", K(ret), K(tablet_id));
} else if (OB_FAIL(tablet_handle.get_obj()->get_meta_disk_addr(tablet_addr))) {
LOG_WARN("failed to get tablet addr", K(ret), K(key));
} else if (!tablet_addr.is_disked()) {
if (OB_FAIL(inner_remove_tablet(ls_id, tablet_id))) {
LOG_WARN("failed to remove non disked tablet from memory", K(ret), K(key));
} else {
FLOG_INFO("succeeded to remove non disked tablet from memory", K(ret), K(key));
}
} else if (OB_FAIL(tablet_ids.push_back(tablet_id))) {
LOG_WARN("failed to push back tablet id", K(ret), K(tablet_id));
}
}
// write slog and do remove tablet
if (OB_FAIL(ret)) {
} else if (tablet_ids.empty()) {
LOG_INFO("all tablets already deleted, do nothing", K(ret), K(ls_id), K(tablet_id_array));
} else if (OB_FAIL(ObTabletSlogHelper::write_remove_tablet_slog(ls_id, tablet_ids))) {
LOG_WARN("failed to write remove tablet slog", K(ret), K(ls_id), K(tablet_ids));
} else {
time_guard.click("WrSlog");
for (int64_t i = 0; OB_SUCC(ret) && i < tablet_ids.count(); ++i) {
const ObTabletID &tablet_id = tablet_ids.at(i);
if (OB_FAIL(inner_remove_tablet(ls_id, tablet_id))) {
LOG_ERROR("failed to do remove tablet", K(ret), K(ls_id), K(tablet_id));
ob_usleep(1000 * 1000);
ob_abort();
}
}
if (OB_SUCC(ret)) {
report_tablet_to_rs(tablet_ids);
time_guard.click("ReportToRS");
}
}
}
}
return ret;
}
int ObLSTabletService::do_remove_tablet(const ObTabletMapKey &key)
{
int ret = OB_SUCCESS;
ObTimeGuard time_guard("RmTabletLock", 1_s);
ObBucketHashWLockGuard lock_guard(bucket_lock_, key.tablet_id_.hash());
time_guard.click("Lock");
if (OB_FAIL(inner_remove_tablet(key.ls_id_, key.tablet_id_))) {
LOG_WARN("fail to remove tablet with lock", K(ret), K(key));
}
return ret;
}
// TODO(yunshan.tys) cope with failure of deleting tablet (tablet hasn't been loaded from disk)
int ObLSTabletService::inner_remove_tablet(
const share::ObLSID &ls_id,
const ObTabletID &tablet_id)
{
int ret = OB_SUCCESS;
const ObTabletMapKey key(ls_id, tablet_id);
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
if (OB_FAIL(tablet_id_set_.erase(tablet_id))) {
if (OB_HASH_NOT_EXIST == ret) {
// tablet id is already erased
ret = OB_SUCCESS;
} else {
LOG_WARN("fail to erase tablet id from set", K(ret), K(ls_id), K(tablet_id));
}
}
if (OB_SUCC(ret)) {
// loop retry to delete tablet from t3m
while (OB_FAIL(t3m->del_tablet(key))) {
if (REACH_TIME_INTERVAL(10 * 1000 * 1000)) {
LOG_ERROR("failed to delete tablet from t3m", K(ret), K(ls_id), K(tablet_id));
}
}
}
if (OB_SUCC(ret)) {
FLOG_INFO("succeeded to remove tablet", K(ret), K(ls_id), K(tablet_id));
}
return ret;
}
int ObLSTabletService::get_tablet(
const ObTabletID &tablet_id,
ObTabletHandle &handle,
const int64_t timeout_us,
const ObMDSGetTabletMode mode)
{
int ret = OB_SUCCESS;
const ObTabletMapKey key(ls_->get_ls_id(), tablet_id);
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!tablet_id.is_valid()
|| mode < ObMDSGetTabletMode::READ_ALL_COMMITED)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(tablet_id), K(mode));
} else if (OB_FAIL(ObTabletCreateDeleteHelper::check_and_get_tablet(key, handle, timeout_us, mode,
ObTransVersion::MAX_TRANS_VERSION))) {
if (OB_TABLET_NOT_EXIST == ret) {
LOG_DEBUG("failed to check and get tablet", K(ret), K(key), K(timeout_us), K(mode));
} else {
LOG_WARN("failed to check and get tablet", K(ret), K(key), K(timeout_us), K(mode));
}
}
return ret;
}
int ObLSTabletService::get_tablet_addr(const ObTabletMapKey &key, ObMetaDiskAddr &addr)
{
int ret = OB_SUCCESS;
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else {
// 加读锁保证ckpt与对tablet的操作串行, 防止ckpt时tablet操作处在
// slog已经写入而tablet addr未更新的状态,导致slog丢失
ObBucketHashRLockGuard lock_guard(bucket_lock_, key.tablet_id_.hash());
if (OB_FAIL(t3m->get_tablet_addr(key, addr))) {
LOG_WARN("fail to get tablet addr", K(ret), K(key));
}
}
return ret;
}
void ObLSTabletService::report_tablet_to_rs(const common::ObTabletID &tablet_id)
{
int ret = OB_SUCCESS;
const share::ObLSID &ls_id = ls_->get_ls_id();
if (tablet_id.is_ls_inner_tablet()) {
// no need to report for ls inner tablet
} else if (OB_FAIL(MTL(ObTabletTableUpdater*)->submit_tablet_update_task(ls_id, tablet_id))) {
LOG_WARN("failed to report tablet info", KR(ret), K(ls_id), K(tablet_id));
}
}
void ObLSTabletService::report_tablet_to_rs(
const common::ObIArray<common::ObTabletID> &tablet_id_array)
{
int ret = OB_SUCCESS;
const uint64_t tenant_id = MTL_ID();
const share::ObLSID &ls_id = ls_->get_ls_id();
// ignore ret on purpose
for (int64_t i = 0; i < tablet_id_array.count(); ++i) {
const common::ObTabletID &tablet_id = tablet_id_array.at(i);
if (tablet_id.is_ls_inner_tablet()) {
// no need to report for ls inner tablet
continue;
} else if (OB_FAIL(MTL(ObTabletTableUpdater*)->submit_tablet_update_task(ls_id, tablet_id))) {
LOG_WARN("failed to report tablet info", KR(ret), K(tenant_id), K(ls_id), K(tablet_id));
}
}
}
int ObLSTabletService::table_scan(ObTabletHandle &tablet_handle, ObTableScanIterator &iter, ObTableScanParam &param)
{
int ret = OB_SUCCESS;
NG_TRACE(S_table_scan_begin);
AllowToReadMgr::AllowToReadInfo read_info;
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (FALSE_IT(allow_to_read_mgr_.load_allow_to_read_info(read_info))) {
} else if (!read_info.allow_to_read()) {
ret = OB_REPLICA_NOT_READABLE;
LOG_WARN("ls is not allow to read", K(ret), KPC(ls_));
} else if (OB_FAIL(prepare_scan_table_param(param, *(MTL(ObTenantSchemaService*)->get_schema_service())))) {
LOG_WARN("failed to prepare scan table param", K(ret), K(param));
} else if (OB_FAIL(inner_table_scan(tablet_handle, iter, param))) {
LOG_WARN("failed to do table scan", K(ret), KP(&iter), K(param));
} else {
bool is_same = false;
allow_to_read_mgr_.check_read_info_same(read_info, is_same);
if (!is_same) {
ret = OB_REPLICA_NOT_READABLE;
LOG_WARN("ls is not allow to read", K(ret), KPC(ls_), KP(&iter));
}
}
NG_TRACE(S_table_scan_end);
return ret;
}
int ObLSTabletService::table_rescan(ObTabletHandle &tablet_handle, ObTableScanParam &param, ObNewRowIterator *result)
{
int ret = OB_SUCCESS;
NG_TRACE(S_table_rescan_begin);
AllowToReadMgr::AllowToReadInfo read_info;
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K(result), K_(is_inited));
} else if (OB_ISNULL(result)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid argument", K(ret));
} else if (FALSE_IT(allow_to_read_mgr_.load_allow_to_read_info(read_info))) {
} else if (!read_info.allow_to_read()) {
ret = OB_REPLICA_NOT_READABLE;
LOG_WARN("ls is not allow to read", K(ret), KPC(ls_));
} else if (OB_FAIL(prepare_scan_table_param(param, *(MTL(ObTenantSchemaService*)->get_schema_service())))) {
LOG_WARN("failed to prepare scan table param", K(ret), K(result), K(param));
} else {
ObTableScanIterator *iter = static_cast<ObTableScanIterator*>(result);
if (OB_FAIL(inner_table_scan(tablet_handle, *iter, param))) {
LOG_WARN("failed to do table scan", K(ret), K(result), K(param));
}
}
if (OB_SUCC(ret)) {
bool is_same = false;
allow_to_read_mgr_.check_read_info_same(read_info, is_same);
if (!is_same) {
ret = OB_REPLICA_NOT_READABLE;
LOG_WARN("ls is not allow to read", K(ret), KPC(ls_));
}
}
NG_TRACE(S_table_rescan_end);
return ret;
}
int ObLSTabletService::refresh_tablet_addr(
const share::ObLSID &ls_id,
const common::ObTabletID &tablet_id,
ObTabletHandle &tablet_handle)
{
int ret = OB_SUCCESS;
const ObTabletMapKey key(ls_id, tablet_id);
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
while (OB_SUCC(ret)) {
ret = tablet_id_set_.set(tablet_id);
if (OB_SUCC(ret)) {
break;
} else if (OB_ALLOCATE_MEMORY_FAILED == ret) {
usleep(100 * 1000);
if (REACH_COUNT_INTERVAL(100)) {
LOG_ERROR("no memory for tablet id set, retry", K(ret), K(tablet_id));
}
ret = OB_SUCCESS;
} else {
LOG_WARN("fail to set tablet id set", K(ret), K(tablet_id));
}
}
if (OB_FAIL(ret)) {
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, tablet_handle, tablet_handle))) {
LOG_WARN("failed to add tablet to meta mem mgr", K(ret), K(key), K(tablet_handle));
}
return ret;
}
int ObLSTabletService::trim_old_tablets(const ObTabletID &tablet_id)
{
int ret = OB_SUCCESS;
ObTabletHandle tablet_handle_head;
ObTimeGuard time_guard("ObLSTabletService::trim_old_tablets", 1_s);
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
time_guard.click("Lock");
if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle_head))) {
LOG_WARN("failed to check and get tablet", K(ret), K(tablet_id));
} else if (tablet_handle_head.get_obj()->is_empty_shell()) {
LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", tablet_handle_head.get_obj());
} else if (OB_UNLIKELY(!tablet_handle_head.get_obj()->get_tablet_meta().has_next_tablet_)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("doesn't have old tablet", K(ret), "tablet_meta", tablet_handle_head.get_obj()->get_tablet_meta());
} else {
time_guard.click("GetTablet");
ObTablet *tablet_head = tablet_handle_head.get_obj();
ObTabletHandle new_tablet_handle;
ObLSID ls_id = tablet_head->get_tablet_meta().ls_id_;
tablet_head->trim_tablet_list();
ObMetaDiskAddr disk_addr;
const ObTabletMapKey key(ls_->get_ls_id(), tablet_id);
if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tablet_head, new_tablet_handle))) {
LOG_WARN("fail to persist and transfor tablet", K(ret), KPC(tablet_head), K(new_tablet_handle));
} else if (FALSE_IT(time_guard.click("Persist"))) {
} else if (FALSE_IT(disk_addr = new_tablet_handle.get_obj()->get_tablet_addr())) {
} else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) {
LOG_WARN("failed to write update tablet slog", K(ret), K(ls_id), K(tablet_id), K(disk_addr));
} else if (FALSE_IT(time_guard.click("WrSlog"))) {
} else if (OB_FAIL(MTL(ObTenantMetaMemMgr*)->compare_and_swap_tablet(
key, tablet_handle_head, new_tablet_handle))) {
LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(tablet_handle_head), K(new_tablet_handle));
ob_usleep(1000 * 1000);
ob_abort();
} else {
time_guard.click("CASwap");
FLOG_INFO("succeeded to trim tablets list", K(key), K(disk_addr));
}
}
return ret;
}
int ObLSTabletService::rollback_rebuild_tablet(const ObTabletID &tablet_id)
{
int ret = OB_SUCCESS;
ObTabletHandle tablet_handle_head;
ObTimeGuard time_guard("ObLSTabletService::rollback_rebuild_tablet", 1_s);
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
time_guard.click("Lock");
if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle_head))) {
LOG_WARN("failed to check and get tablet", K(ret), K(tablet_id));
} else if (tablet_handle_head.get_obj()->is_empty_shell()) {
LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", tablet_handle_head.get_obj());
} else {
time_guard.click("GetTablet");
ObTablet *tablet_head = tablet_handle_head.get_obj();
ObTabletHandle next_tablet_handle;
ObMetaObj<ObTablet> meta_obj;
tablet_head->get_next_tablet_guard().get_obj(meta_obj);
next_tablet_handle.set_obj(meta_obj);
next_tablet_handle.set_wash_priority(WashTabletPriority::WTP_LOW);
const ObTabletMapKey key(ls_->get_ls_id(), tablet_id);
ObMetaDiskAddr disk_addr;
ObTabletHandle new_tablet_handle;
if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(
*next_tablet_handle.get_obj(), new_tablet_handle))) {
LOG_WARN("fail to persist and transform tablet", K(ret), K(next_tablet_handle), K(new_tablet_handle));
} else if (FALSE_IT(time_guard.click("Persist"))) {
} else if (FALSE_IT(disk_addr = new_tablet_handle.get_obj()->get_tablet_addr())) {
} else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(
key.ls_id_, tablet_id, disk_addr))) {
LOG_WARN("failed to write update tablet slog", K(ret), K(key), K(disk_addr));
} else if (FALSE_IT(time_guard.click("WrSlog"))) {
} else if (OB_FAIL(MTL(ObTenantMetaMemMgr*)->compare_and_swap_tablet(
key, tablet_handle_head, new_tablet_handle))) {
LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(tablet_handle_head), K(new_tablet_handle));
ob_usleep(1000 * 1000);
ob_abort();
} else {
time_guard.click("CASwap");
FLOG_INFO("succeeded to rollback rebuild", K(key), K(disk_addr));
}
}
return ret;
}
int ObLSTabletService::rebuild_tablet_with_old(
const ObMigrationTabletParam &mig_tablet_param,
ObTabletHandle &tablet_guard)
{
int ret = OB_SUCCESS;
ObTimeGuard time_guard("ObLSTabletService::rebuild_tablet_with_old", 1_s);
common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "RebuildTablet"));
ObTabletHandle old_tablet_hdl;
ObTabletHandle tmp_tablet_hdl;
ObTabletHandle new_tablet_hdl;
ObTablet *tmp_tablet = nullptr;
ObFreezer *freezer = ls_->get_freezer();
ObMetaDiskAddr disk_addr;
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
const common::ObTabletID &tablet_id = mig_tablet_param.tablet_id_;
const share::ObLSID &ls_id = mig_tablet_param.ls_id_;
const ObTabletMapKey key(ls_id, tablet_id);
if (OB_FAIL(direct_get_tablet(tablet_id, old_tablet_hdl))) {
LOG_WARN("failed to get tablet", K(ret), K(key));
} else if (FALSE_IT(time_guard.click("GetTablet"))) {
} else if (old_tablet_hdl.get_obj()->is_empty_shell()) {
LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", old_tablet_hdl.get_obj());
} else if (OB_FAIL(ObTabletCreateDeleteHelper::acquire_tmp_tablet(key, allocator, tmp_tablet_hdl))) {
LOG_WARN("fail to acquire temporary tablet", K(ret), K(key));
} else if (FALSE_IT(tmp_tablet = tmp_tablet_hdl.get_obj())) {
} else if (OB_FAIL(tmp_tablet->init_with_migrate_param(allocator, mig_tablet_param, true/*is_update*/, freezer))) {
LOG_WARN("failed to init tablet", K(ret), K(mig_tablet_param));
} else if (FALSE_IT(time_guard.click("InitTablet"))) {
} else if (FALSE_IT(tmp_tablet->set_next_tablet_guard(tablet_guard))) {
} else if (FALSE_IT(time_guard.click("InitTablet"))) {
} else if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tmp_tablet, new_tablet_hdl))) {
LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tmp_tablet), K(new_tablet_hdl));
} else if (FALSE_IT(time_guard.click("Persist"))) {
} else if (FALSE_IT(disk_addr = new_tablet_hdl.get_obj()->tablet_addr_)) {
} else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) {
LOG_WARN("fail to write update tablet slog", K(ret), K(ls_id), K(tablet_id), K(disk_addr));
} else if (FALSE_IT(time_guard.click("WrSlog"))) {
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_hdl, new_tablet_hdl))) {
LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(old_tablet_hdl), K(new_tablet_hdl));
ob_usleep(1000 * 1000);
ob_abort();
} else if (OB_FAIL(new_tablet_hdl.get_obj()->start_ddl_if_need())) {
LOG_WARN("start ddl if need failed", K(ret), K(key));
} else {
time_guard.click("CASwap");
LOG_INFO("rebuild tablet with old succeed", K(ret), K(key), K(disk_addr));
}
return ret;
}
int ObLSTabletService::migrate_update_tablet(
const ObMigrationTabletParam &mig_tablet_param)
{
int ret = OB_SUCCESS;
ObTimeGuard time_guard("ObLSTabletService::migrate_update_tablet", 1_s);
common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "MigUpTab"));
const common::ObTabletID &tablet_id = mig_tablet_param.tablet_id_;
const share::ObLSID &ls_id = mig_tablet_param.ls_id_;
const ObTabletMapKey key(mig_tablet_param.ls_id_, mig_tablet_param.tablet_id_);
ObTabletHandle old_tablet_hdl;
ObTabletHandle tmp_tablet_hdl;
ObTabletHandle new_tablet_hdl;
ObTablet *new_tablet = nullptr;
ObMetaDiskAddr disk_addr;
ObFreezer *freezer = ls_->get_freezer();
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
if (OB_FAIL(direct_get_tablet(tablet_id, old_tablet_hdl))) {
LOG_WARN("failed to get tablet", K(ret), K(key));
} else if (FALSE_IT(time_guard.click("GetTablet"))) {
} else if (OB_FAIL(ObTabletCreateDeleteHelper::acquire_tmp_tablet(key, allocator, tmp_tablet_hdl))) {
LOG_WARN("fail to acquire temporary tablet", K(ret), K(key));
} else if (FALSE_IT(new_tablet = tmp_tablet_hdl.get_obj())) {
} else if (OB_FAIL(new_tablet->init_with_migrate_param(allocator, mig_tablet_param, true/*is_update*/, freezer))) {
LOG_WARN("failed to init tablet", K(ret), K(mig_tablet_param));
} else if (FALSE_IT(time_guard.click("InitTablet"))) {
} else if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*new_tablet, new_tablet_hdl))) {
LOG_WARN("fail to persist and transform tablet", K(ret), KPC(new_tablet), K(new_tablet_hdl));
} else if (FALSE_IT(time_guard.click("Persist"))) {
} else if (FALSE_IT(disk_addr = new_tablet_hdl.get_obj()->tablet_addr_)) {
} else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) {
LOG_WARN("fail to write update tablet slog", K(ret), K(ls_id), K(tablet_id), K(disk_addr));
} else if (FALSE_IT(time_guard.click("WrSlog"))) {
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_hdl, new_tablet_hdl))) {
LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(old_tablet_hdl), K(new_tablet_hdl));
ob_usleep(1000 * 1000);
ob_abort();
} else if (OB_FAIL(new_tablet_hdl.get_obj()->start_ddl_if_need())) {
LOG_WARN("start ddl if need failed", K(ret));
} else {
time_guard.click("CASwap");
LOG_INFO("migrate update tablet succeed", K(ret), K(key), K(disk_addr));
}
return ret;
}
int ObLSTabletService::migrate_create_tablet(
const ObMigrationTabletParam &mig_tablet_param,
ObTabletHandle &handle)
{
int ret = OB_SUCCESS;
ObTimeGuard time_guard("ObLSTabletService::migrate_create_tablet", 1_s);
common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "MigCreateTab"));
const share::ObLSID &ls_id = mig_tablet_param.ls_id_;
const common::ObTabletID &tablet_id = mig_tablet_param.tablet_id_;
const ObTabletMapKey key(ls_id, tablet_id);
ObFreezer *freezer = ls_->get_freezer();
ObTabletHandle tmp_tablet_hdl;
ObTabletHandle tablet_handle;
ObMetaDiskAddr disk_addr;
if (OB_FAIL(ObTabletCreateDeleteHelper::create_tmp_tablet(key, allocator, tmp_tablet_hdl))) {
LOG_WARN("fail to create temporary tablet", K(ret), K(key));
} else if (OB_FAIL(tmp_tablet_hdl.get_obj()->init_with_migrate_param(allocator, mig_tablet_param, false/*is_update*/, freezer))) {
LOG_WARN("fail to init tablet", K(ret), K(mig_tablet_param));
} else if (FALSE_IT(time_guard.click("InitTablet"))) {
} else if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tmp_tablet_hdl.get_obj(), tablet_handle))) {
LOG_WARN("fail to persist and transform tablet", K(ret), K(tmp_tablet_hdl), K(tablet_handle));
} else if (FALSE_IT(time_guard.click("Persist"))) {
} else if (FALSE_IT(disk_addr = tablet_handle.get_obj()->tablet_addr_)) {
} else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) {
LOG_WARN("fail to write update tablet slog", K(ret), K(ls_id), K(tablet_id), K(disk_addr));
} else if (FALSE_IT(time_guard.click("WrSlog"))) {
} else if (OB_FAIL(refresh_tablet_addr(ls_id, tablet_id, tablet_handle))) {
LOG_WARN("failed to refresh tablet addr", K(ret), K(ls_id), K(tablet_id), K(lbt()));
ob_usleep(1000 * 1000);
ob_abort();
} else if (FALSE_IT(time_guard.click("RefreshAddr"))) {
} else if (OB_FAIL(tablet_handle.get_obj()->start_ddl_if_need())) {
LOG_WARN("start ddl if need failed", K(ret));
} else {
LOG_INFO("migrate create tablet succeed", K(ret), K(key), K(disk_addr));
}
if (OB_SUCC(ret)) {
handle = tablet_handle;
} else {
int tmp_ret = OB_SUCCESS;
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
if (OB_TMP_FAIL(tablet_id_set_.erase(tablet_id))) {
if (OB_HASH_NOT_EXIST != tmp_ret) {
LOG_ERROR("fail to erase tablet id from set", K(tmp_ret), K(tablet_id));
}
}
if (OB_TMP_FAIL(inner_remove_tablet(key.ls_id_, key.tablet_id_))) {
LOG_WARN("fail to erase tablet from meta memory manager", K(tmp_ret), K(key));
}
}
return ret;
}
int ObLSTabletService::refresh_memtable_for_ckpt(
const ObMetaDiskAddr &old_addr,
const ObMetaDiskAddr &cur_addr,
ObTabletHandle &new_tablet_handle)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(!old_addr.is_equal_for_persistence(cur_addr))) {
ret = OB_NOT_THE_OBJECT;
LOG_WARN("the old tablet has been replaced", K(ret), K(old_addr), K(cur_addr));
} else if (OB_UNLIKELY(old_addr != cur_addr)) {
// memtables were updated
if (OB_FAIL(new_tablet_handle.get_obj()->refresh_memtable_and_update_seq(cur_addr.seq()))) {
LOG_WARN("fail to pull newest memtables", K(ret), K(old_addr), K(cur_addr), K(new_tablet_handle));
}
}
return ret;
}
int ObLSTabletService::update_tablet_checkpoint(
const ObTabletMapKey &key,
const ObMetaDiskAddr &old_addr,
const ObMetaDiskAddr &new_addr,
const bool is_replay_old,
ObTabletHandle &new_handle)
{
int ret = OB_SUCCESS;
ObTimeGuard time_guard("UpdateTabletCKPT", 3_s);
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("ls tablet svr hasn't been inited", K(ret));
} else if (OB_UNLIKELY(!key.is_valid()
|| !old_addr.is_valid()
|| !new_addr.is_valid()
|| !new_addr.is_block()
|| (!is_replay_old && !new_handle.is_valid()))) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid argument", K(ret), K(key), K(new_addr), K(new_handle));
} else {
common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "CKPTUpdate"));
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
ObTabletHandle tablet_handle;
ObMetaDiskAddr addr;
ObBucketHashWLockGuard lock_guard(bucket_lock_, key.tablet_id_.hash());
time_guard.click("Lock");
if (OB_FAIL(t3m->get_tablet_addr(key, addr))) {
if (OB_ENTRY_NOT_EXIST == ret) {
ret = OB_TABLET_NOT_EXIST;
}
LOG_WARN("fail to get old tablet addr", K(ret), K(key));
} else if (!is_replay_old) {
if (OB_FAIL(t3m->get_tablet(WashTabletPriority::WTP_LOW, key, tablet_handle))) {
LOG_WARN("fail to get tablet", K(ret), K(key));
} else if (FALSE_IT(time_guard.click("GetOld"))) {
} else if (OB_FAIL(refresh_memtable_for_ckpt(old_addr, addr, new_handle))) {
LOG_WARN("fail to update tablet", K(ret), K(old_addr), K(addr), K(new_handle));
} else if (FALSE_IT(time_guard.click("UpdateTablet"))) {
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, tablet_handle, new_handle))) {
LOG_WARN("fail to compare and swap tablet", K(ret), K(tablet_handle), K(new_handle));
}
} else {
time_guard.click("GetOld");
if (OB_UNLIKELY(addr != old_addr)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("the old tablet has been replaced, which is not allowed during upgrade",
K(ret), K(addr), K(old_addr));
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_addr, new_addr))) {
LOG_WARN("fail to compare and swap tablet", K(ret), K(old_addr), K(new_addr));
}
}
if (OB_SUCC(ret)) {
time_guard.click("CASwap");
FLOG_INFO("succeeded to update tablet ckpt", K(key), K(old_addr), K(new_addr),
K(is_replay_old));
}
}
return ret;
}
int ObLSTabletService::update_tablet_table_store(
const ObTabletHandle &old_tablet_handle,
const ObIArray<storage::ObITable *> &tables)
{
int ret = OB_SUCCESS;
common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "UpTabStore"));
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("ls tablet svr hasn't been inited", K(ret));
} else if (OB_UNLIKELY(!old_tablet_handle.is_valid() || 0 == tables.count())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("old tablet handle is invalid", K(ret), K(old_tablet_handle), K(tables.count()));
} else {
ObTablet *old_tablet = old_tablet_handle.get_obj();
const common::ObTabletID &tablet_id = old_tablet->get_tablet_meta().tablet_id_;
ObTimeGuard time_guard("ObLSTabletService::ReplaceSSTable", 1_s);
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
time_guard.click("Lock");
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
ObTabletHandle tablet_handle;
if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle))) {
if (OB_TABLET_NOT_EXIST == ret) {
ret = OB_EAGAIN;
LOG_WARN("this tablet has been deleted, skip it", K(ret), K(tablet_id));
} else {
LOG_WARN("fail to get tablet", K(ret));
}
} else if (tablet_handle.get_obj() != old_tablet) {
ret = OB_EAGAIN;
LOG_WARN("tablet has changed, skip it", K(ret), K(tablet_handle), K(old_tablet_handle));
} else if (old_tablet->is_empty_shell()) {
LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", old_tablet);
} else {
time_guard.click("GetTablet");
ObTabletHandle tmp_tablet_hdl;
ObTabletHandle new_tablet_hdl;
ObTablet *tmp_tablet = nullptr;
const share::ObLSID &ls_id = ls_->get_ls_id();
const ObTabletMapKey key(ls_id, tablet_id);
ObMetaDiskAddr disk_addr;
if (OB_FAIL(ObTabletCreateDeleteHelper::acquire_tmp_tablet(key, allocator, tmp_tablet_hdl))) {
LOG_WARN("fail to acquire temporary tablet", K(ret), K(key));
} else if (FALSE_IT(tmp_tablet = tmp_tablet_hdl.get_obj())) {
} else if (OB_FAIL(tmp_tablet->init_for_defragment(allocator, tables, *old_tablet))) {
LOG_WARN("fail to init new tablet", K(ret), KPC(old_tablet));
} else if (FALSE_IT(time_guard.click("InitTablet"))) {
} else if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tmp_tablet, new_tablet_hdl))) {
LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tmp_tablet), K(new_tablet_hdl));
} else if (FALSE_IT(disk_addr = new_tablet_hdl.get_obj()->tablet_addr_)) {
} else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) {
LOG_WARN("fail to write update tablet slog", K(ret), K(ls_id), K(tablet_id), K(disk_addr));
} else if (FALSE_IT(time_guard.click("WrSlog"))) {
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_handle, new_tablet_hdl))) {
LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(old_tablet_handle), K(new_tablet_hdl));
ob_usleep(1000 * 1000);
ob_abort();
} else {
time_guard.click("CASwap");
LOG_INFO("succeeded to build new tablet", K(ret), K(disk_addr),
K(new_tablet_hdl), KPC(new_tablet_hdl.get_obj()));
}
}
}
return ret;
}
int ObLSTabletService::update_tablet_table_store(
const common::ObTabletID &tablet_id,
const ObUpdateTableStoreParam &param,
ObTabletHandle &handle)
{
int ret = OB_SUCCESS;
common::ObArenaAllocator allocator("UpdateTmpTablet", OB_MALLOC_NORMAL_BLOCK_SIZE, MTL_ID(), ObCtxIds::DEFAULT_CTX_ID);
if (share::is_reserve_mode()) {
// TODO(@DanLing) use LocalArena later
allocator.set_ctx_id(ObCtxIds::MERGE_RESERVE_CTX_ID);
}
const share::ObLSID &ls_id = ls_->get_ls_id();
const ObTabletMapKey key(ls_id, tablet_id);
ObTabletHandle old_tablet_hdl;
ObTabletHandle tmp_tablet_hdl;
ObTabletHandle new_tablet_hdl;
ObTimeGuard time_guard("ObLSTabletService::UpdateTableStore", 1_s);
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!tablet_id.is_valid() || !param.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(tablet_id), K(param));
} else if (OB_FAIL(ObTabletCreateDeleteHelper::acquire_tmp_tablet(key, allocator, tmp_tablet_hdl))) {
if (OB_ENTRY_NOT_EXIST == ret) {
ret = OB_TABLET_NOT_EXIST;
} else {
LOG_WARN("fail to acquire temporary tablet", K(ret), K(key));
}
} else {
ObTablet *tmp_tablet = tmp_tablet_hdl.get_obj();
time_guard.click("Acquire");
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
time_guard.click("Lock");
if (OB_FAIL(direct_get_tablet(tablet_id, old_tablet_hdl))) {
LOG_WARN("failed to get tablet", K(ret), K(tablet_id));
} else if (old_tablet_hdl.get_obj()->is_empty_shell()) {
handle = old_tablet_hdl;
LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", old_tablet_hdl.get_obj());
} else {
time_guard.click("GetTablet");
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
ObTablet *old_tablet = old_tablet_hdl.get_obj();
ObMetaDiskAddr disk_addr;
if (OB_FAIL(tmp_tablet->init_for_merge(allocator, param, *old_tablet))) {
LOG_WARN("failed to init tablet", K(ret), K(param), KPC(old_tablet));
} else if (FALSE_IT(time_guard.click("InitNew"))) {
} else if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tmp_tablet, new_tablet_hdl))) {
LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tmp_tablet), K(new_tablet_hdl));
} else if (FALSE_IT(disk_addr = new_tablet_hdl.get_obj()->tablet_addr_)) {
} else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) {
LOG_WARN("fail to write update tablet slog", K(ret), K(ls_id), K(tablet_id), K(disk_addr));
} else if (FALSE_IT(time_guard.click("WrSlog"))) {
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_hdl, new_tablet_hdl))) {
LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(old_tablet_hdl), K(new_tablet_hdl));
ob_usleep(1000 * 1000);
ob_abort();
} else if (FALSE_IT(time_guard.click("CASwap"))) {
} else {
handle = new_tablet_hdl;
LOG_INFO("succeeded to build new tablet", K(ret), K(key), K(disk_addr), K(param), K(handle));
}
}
}
return ret;
}
int ObLSTabletService::update_tablet_mstx(
const ObTabletMapKey &key,
const ObMetaDiskAddr &old_addr,
const ObTabletHandle &old_tablet_handle,
ObTabletHandle &new_tablet_handle)
{
int ret = OB_SUCCESS;
ObTablet *new_tablet = nullptr;
ObMetaDiskAddr new_addr;
ObTimeGuard time_guard("ObLSTabletService::update_tablet_mstx", 1_s);
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!key.is_valid()
|| !old_addr.is_valid()
|| !old_tablet_handle.is_valid()
|| !new_tablet_handle.is_valid()
|| !(new_tablet = new_tablet_handle.get_obj())->is_valid()
|| !(new_addr = new_tablet->get_tablet_addr()).is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(key), K(old_addr), K(old_tablet_handle),
K(new_tablet_handle), KPC(new_tablet), K(new_addr));
} else {
ObMetaDiskAddr addr;
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
ObBucketHashWLockGuard lock_guard(bucket_lock_, key.tablet_id_.hash());
time_guard.click("Lock");
ObTabletHandle curr_tablet_handle;
if (OB_FAIL(direct_get_tablet(key.tablet_id_, curr_tablet_handle))) {
if (OB_ENTRY_NOT_EXIST == ret) {
ret = OB_SUCCESS; // deleted, skip
} else {
LOG_WARN("fail to get tablet", K(ret), K(key));
}
} else if (curr_tablet_handle.get_obj() != old_tablet_handle.get_obj()) {
// we could never persist this tablet, skip this
LOG_INFO("tablet has been changed", K(ret), K(key), K(old_addr), K(old_tablet_handle), K(curr_tablet_handle));
} else if (FALSE_IT(addr = curr_tablet_handle.get_obj()->get_tablet_addr())) {
} else if (old_addr != addr) { /* the same full tablet obj with different memtables will hit this */
// Let this updating fail and throw tablet back to the persist queue.
// It will be tackled correctly in the next round because its address will be compared
// again in ObFullTabletCreator::persist_tablet()
ret = common::OB_NOT_THE_OBJECT;
LOG_WARN("old address has changed, skip update", K(ret), K(key), K(addr), K(old_addr));
} else {
time_guard.click("GetOld");
if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(key.ls_id_, key.tablet_id_, new_addr))) {
LOG_WARN("fail to write update tablet slog", K(ret), K(key), K(new_addr));
} else if (FALSE_IT(time_guard.click("WrSlog"))) {
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_handle, new_tablet_handle))) {
LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(old_tablet_handle), K(new_tablet_handle));
ob_usleep(1000 * 1000);
ob_abort();
} else if (FALSE_IT(time_guard.click("CASwap"))) {
} else {
FLOG_INFO("succeeded to update tablet mstx", K(ret),
K(key), K(old_addr), K(old_tablet_handle), K(new_addr), K(new_tablet_handle));
}
}
}
return ret;
}
int ObLSTabletService::update_tablet_to_empty_shell(const common::ObTabletID &tablet_id)
{
int ret = OB_SUCCESS;
const share::ObLSID &ls_id = ls_->get_ls_id();
const ObTabletMapKey key(ls_id, tablet_id);
common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "UpdEmptySh"));
ObTabletHandle new_tablet_handle;
ObTabletHandle tmp_tablet_handle;
ObTabletHandle old_tablet_handle;
ObTimeGuard time_guard("UpdateTabletToEmptyShell", 3_s);
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
time_guard.click("Lock");
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("ls tablet svr hasn't been inited", K(ret));
} else if (OB_UNLIKELY(!tablet_id.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(tablet_id));
} else if (OB_FAIL(direct_get_tablet(tablet_id, old_tablet_handle))) {
LOG_WARN("failed to get tablet", K(ret), K(tablet_id));
} else if (old_tablet_handle.get_obj()->is_empty_shell()) {
LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", old_tablet_handle.get_obj());
} else if (FALSE_IT(time_guard.click("GetOld"))) {
} else if (OB_FAIL(ObTabletCreateDeleteHelper::acquire_tmp_tablet(key, allocator, tmp_tablet_handle))) {
LOG_WARN("fail to acquire temporary tablet", K(ret), K(key));
} else {
time_guard.click("Acquire");
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
ObTablet *old_tablet = old_tablet_handle.get_obj();
ObTablet *tmp_tablet = tmp_tablet_handle.get_obj();
ObTablet *new_tablet = nullptr;
ObMetaDiskAddr disk_addr;
if (OB_FAIL(tmp_tablet->init_empty_shell(*tmp_tablet_handle.get_allocator(), *old_tablet))) {
LOG_WARN("failed to init tablet", K(ret), KPC(old_tablet));
} else if (FALSE_IT(time_guard.click("InitNew"))) {
} else if (OB_FAIL(ObTabletPersister::transform_empty_shell(*tmp_tablet, new_tablet_handle))) {
LOG_WARN("fail to transform emtpy shell", K(ret), K(tablet_id));
} else if (FALSE_IT(time_guard.click("Trans"))) {
} else if (FALSE_IT(new_tablet = new_tablet_handle.get_obj())) {
} else if (OB_FAIL(ObTabletSlogHelper::write_empty_shell_tablet_slog(new_tablet, disk_addr))) {
LOG_WARN("fail to write emtpy shell tablet slog", K(ret), K(tablet_id), K(disk_addr));
} else if (FALSE_IT(new_tablet->tablet_addr_ = disk_addr)) {
} else if (FALSE_IT(time_guard.click("WrSlog"))) {
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_handle, new_tablet_handle))) {
LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(old_tablet_handle), K(new_tablet_handle));
ob_usleep(1000 * 1000);
ob_abort();
} else {
ls_->get_tablet_gc_handler()->set_tablet_gc_trigger();
time_guard.click("CASwap");
LOG_INFO("succeeded to build empty shell tablet", K(ret), K(key), K(disk_addr));
}
}
return ret;
}
int ObLSTabletService::update_medium_compaction_info(
const common::ObTabletID &tablet_id,
ObTabletHandle &handle)
{
int ret = OB_SUCCESS;
common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "UpMeidumCom"));
ObTabletHandle old_tablet_handle;
ObTimeGuard time_guard("ObLSTabletService::update_medium_compaction_info", 1_s);
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
time_guard.click("Lock");
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!tablet_id.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(tablet_id));
} else if (OB_FAIL(direct_get_tablet(tablet_id, old_tablet_handle))) {
LOG_WARN("failed to check and get tablet", K(ret), K(tablet_id));
} else if (old_tablet_handle.get_obj()->is_empty_shell()) {
handle = old_tablet_handle;
LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", old_tablet_handle.get_obj());
} else {
time_guard.click("GetTablet");
ObTabletHandle tmp_tablet_hdl;
ObTabletHandle new_tablet_hdl;
ObTablet *tmp_tablet = nullptr;
ObTablet *old_tablet = old_tablet_handle.get_obj();
const share::ObLSID &ls_id = ls_->get_ls_id();
const ObTabletMapKey key(ls_id, tablet_id);
ObMetaDiskAddr disk_addr;
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
if (OB_FAIL(ObTabletCreateDeleteHelper::acquire_tmp_tablet(key, allocator, tmp_tablet_hdl))) {
if (OB_ENTRY_NOT_EXIST == ret) {
ret = OB_TABLET_NOT_EXIST;
} else {
LOG_WARN("failed to acquire tablet", K(ret), K(key));
}
} else if (FALSE_IT(tmp_tablet = tmp_tablet_hdl.get_obj())) {
} else if (OB_FAIL(tmp_tablet->init_with_update_medium_info(allocator, *old_tablet))) {
LOG_WARN("failed to init tablet", K(ret), KPC(old_tablet));
} else if (FALSE_IT(time_guard.click("InitNew"))) {
} else if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tmp_tablet, new_tablet_hdl))) {
LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tmp_tablet), K(new_tablet_hdl));
} else if (FALSE_IT(disk_addr = new_tablet_hdl.get_obj()->tablet_addr_)) {
} else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) {
LOG_WARN("fail to write update tablet slog", K(ret), K(ls_id), K(tablet_id), K(disk_addr));
} else if (FALSE_IT(time_guard.click("WrSlog"))) {
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_handle, new_tablet_hdl))) {
LOG_WARN("failed to compare and swap tablet", K(ret), K(key), K(old_tablet_handle), K(new_tablet_hdl));
} else if (FALSE_IT(time_guard.click("CASwap"))) {
} else {
handle = new_tablet_hdl;
}
}
return ret;
}
int ObLSTabletService::build_new_tablet_from_mds_table(
const common::ObTabletID &tablet_id,
const int64_t mds_construct_sequence,
const share::SCN &flush_scn)
{
TIMEGUARD_INIT(STORAGE, 10_ms);
int ret = OB_SUCCESS;
common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "BuildMSD"));
const share::ObLSID &ls_id = ls_->get_ls_id();
const ObTabletMapKey key(ls_id, tablet_id);
ObTabletHandle old_tablet_handle;
ObTabletHandle tmp_tablet_hdl;
ObTabletHandle new_tablet_handle;
ObTimeGuard time_guard("MdsDump", 3_s);
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!tablet_id.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(tablet_id));
} else if (CLICK_FAIL(ObTabletCreateDeleteHelper::acquire_tmp_tablet(key, allocator, tmp_tablet_hdl))) {
LOG_WARN("failed to acquire tablet", K(ret), K(key));
} else {
ObTablet *tmp_tablet = tmp_tablet_hdl.get_obj();
time_guard.click("Acquire");
CLICK();
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
time_guard.click("Lock");
if (CLICK_FAIL(direct_get_tablet(tablet_id, old_tablet_handle))) {
LOG_WARN("failed to get tablet", K(ret), K(tablet_id));
} else if (old_tablet_handle.get_obj()->is_empty_shell()) {
LOG_INFO("old tablet is empty shell tablet, should skip mds table dump operation", K(ret),
"old_tablet", *old_tablet_handle.get_obj());
} else {
time_guard.click("GetOld");
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
ObTablet *old_tablet = old_tablet_handle.get_obj();
ObMetaDiskAddr disk_addr;
ObArenaAllocator arena_allocator(common::ObMemAttr(MTL_ID(), "mds_reader"));
ObTabletMdsData mds_data;
if (OB_FAIL(ret)) {
} else if (CLICK_FAIL(old_tablet->read_mds_table(arena_allocator, mds_data, true, mds_construct_sequence))) {
if (OB_EMPTY_RESULT == ret) {
ret = OB_SUCCESS;
LOG_INFO("read nothing from mds table, no need to build new tablet", K(ret), K(key));
} else {
LOG_WARN("failed to read mds table", K(ret), K(key));
}
} else if (CLICK_FAIL(tmp_tablet->init_for_mds_table_dump(allocator, *old_tablet, flush_scn, mds_data, old_tablet->mds_data_))) {
LOG_WARN("failed to init tablet", K(ret), KPC(old_tablet), K(flush_scn));
} else if (CLICK_FAIL(ObTabletPersister::persist_and_transform_tablet(*tmp_tablet, new_tablet_handle))) {
LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tmp_tablet), K(new_tablet_handle));
} else if (FALSE_IT(disk_addr = new_tablet_handle.get_obj()->tablet_addr_)) {
} else if (CLICK_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) {
} else if (FALSE_IT(time_guard.click("WrSlog"))) {
LOG_WARN("fail to write update tablet slog", K(ret), K(ls_id), K(tablet_id), K(disk_addr));
} else if (CLICK_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_handle, new_tablet_handle))) {
LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(disk_addr), K(old_tablet_handle));
ob_usleep(1000 * 1000);
ob_abort();
} else {
CLICK();
time_guard.click("CASwap");
LOG_INFO("succeeded to build new tablet", K(ret), K(key), K(disk_addr), K(new_tablet_handle), K(mds_data));
}
}
}
return ret;
}
int ObLSTabletService::update_tablet_release_memtable_for_offline(
const common::ObTabletID &tablet_id,
const SCN scn)
{
int ret = OB_SUCCESS;
const ObLSID ls_id(ls_->get_ls_id());
const ObTabletMapKey key(ls_id, tablet_id);
ObTabletHandle tablet_handle;
ObTablet *tablet = nullptr;
ObTimeGuard time_guard("ObLSTabletService::update_tablet_release_memtable", 1_s);
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
time_guard.click("Lock");
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!tablet_id.is_valid() || !scn.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid arguments", K(ret), K(tablet_id), K(scn));
} else if (OB_FAIL(ObTabletCreateDeleteHelper::get_tablet(key, tablet_handle))) {
LOG_WARN("fail to direct get tablet", K(ret), K(key));
} else if (OB_ISNULL(tablet = tablet_handle.get_obj())) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("tablet should not be NULL", K(ret), K(key));
} else if (tablet->is_empty_shell()) {
//do nothing
} else {
time_guard.click("get_tablet");
ObITable *table = nullptr;
ObTableStoreIterator iter;
const bool is_from_buf_pool = nullptr == tablet_handle.get_obj()->get_allocator();
if (is_from_buf_pool) {
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
ObTabletHandle new_tablet_handle;
if (OB_FAIL(ObTabletPersister::copy_from_old_tablet(*tablet, new_tablet_handle))) {
LOG_WARN("fail to copy from old tablet", K(ret), KPC(tablet));
} else if (FALSE_IT(time_guard.click("CpTablet"))) {
} else if (OB_FAIL(new_tablet_handle.get_obj()->rebuild_memtables(scn))) {
LOG_WARN("fail to rebuild memtables", K(ret), K(scn), K(new_tablet_handle));
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, tablet_handle, new_tablet_handle))) {
LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(tablet_handle), K(new_tablet_handle));
} else {
time_guard.click("CASwap");
LOG_INFO("succeeded to copy tablet to release memtable", K(ret), K(key), K(tablet_handle), K(new_tablet_handle));
}
} else if (OB_UNLIKELY(!tablet->get_tablet_addr().is_memory())) {
ret = OB_NOT_SUPPORTED;
LOG_ERROR("This tablet is full tablet, but its addr isn't memory", K(ret), KPC(tablet));
} else if (OB_FAIL(tablet->get_all_sstables(iter))) {
LOG_WARN("fail to get all sstable", K(ret), K(iter));
} else if (1 == iter.count() && OB_FAIL(iter.get_next(table))) {
LOG_WARN("fail to get next table", K(ret), K(iter));
} else if (OB_UNLIKELY(iter.count() > 1)
|| (OB_NOT_NULL(table) && (!table->is_sstable()
|| static_cast<ObSSTable *>(table)->get_data_macro_block_count() != 0))) {
ret = OB_NOT_SUPPORTED;
LOG_ERROR("This tablet is full tablet, but all of its sstables isn't only one empty major",
K(ret), K(iter), KPC(table));
} else if (OB_FAIL(tablet_handle.get_obj()->wait_release_memtables())) {
LOG_ERROR("failed to release memtables", K(ret), K(tablet_id));
} else if (OB_FAIL(inner_remove_tablet(ls_id, tablet_id))) {
LOG_ERROR("failed to do remove tablet", K(ret), K(ls_id), K(tablet_id));
} else {
time_guard.click("RmTablet");
}
}
return ret;
}
int ObLSTabletService::update_tablet_report_status(
const common::ObTabletID &tablet_id,
const bool found_column_group_checksum_error)
{
int ret = OB_SUCCESS;
ObTabletHandle tablet_handle;
ObTimeGuard time_guard("ObLSTabletService::update_tablet_report_status", 1_s);
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
time_guard.click("Lock");
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!tablet_id.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(tablet_id));
} else if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle))) {
LOG_WARN("failed to get tablet", K(ret), K(tablet_id));
} else if (tablet_handle.get_obj()->is_empty_shell()) {
LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", tablet_handle.get_obj());
} else {
time_guard.click("GetTablet");
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
ObMetaDiskAddr disk_addr;
const ObTabletMapKey key(ls_->get_ls_id(), tablet_id);
ObTablet *tablet = tablet_handle.get_obj();
ObTabletHandle new_tablet_handle;
bool need_report = true;
if (OB_UNLIKELY(found_column_group_checksum_error)) {
tablet->tablet_meta_.report_status_.found_cg_checksum_error_ = true;
} else if (tablet->tablet_meta_.report_status_.need_report()) {
tablet->tablet_meta_.report_status_.cur_report_version_ = tablet->tablet_meta_.report_status_.merge_snapshot_version_;
} else {
need_report = false;
FLOG_INFO("tablet doesn't need to report", K(ret), K(tablet_id));
}
if (need_report) {
if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tablet, new_tablet_handle))) {
LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tablet), K(new_tablet_handle));
} else if (FALSE_IT(time_guard.click("Persist"))) {
} else if (FALSE_IT(disk_addr = new_tablet_handle.get_obj()->tablet_addr_)) {
} else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(key.ls_id_, tablet_id, disk_addr))) {
LOG_WARN("failed to write update tablet slog", K(ret), K(key), K(disk_addr));
} else if (FALSE_IT(time_guard.click("WrSlog"))) {
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, tablet_handle, new_tablet_handle))) {
LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(tablet_handle), K(new_tablet_handle));
ob_usleep(1000 * 1000);
ob_abort();
} else {
time_guard.click("CASwap");
LOG_INFO("succeeded to build new tablet", K(ret), K(key), K(disk_addr), K(tablet_handle));
}
}
}
return ret;
}
int ObLSTabletService::update_tablet_snapshot_version(
const common::ObTabletID &tablet_id,
const int64_t snapshot_version)
{
int ret = OB_SUCCESS;
common::ObArenaAllocator allocator;
ObTabletHandle old_tablet_handle;
ObTimeGuard time_guard("ObLSTabletService::update_tablet_snapshot_version", 1 * 1000 * 1000);
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
time_guard.click("Lock");
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!tablet_id.is_valid() || 0 >= snapshot_version)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(tablet_id), K(snapshot_version));
} else if (OB_FAIL(direct_get_tablet(tablet_id, old_tablet_handle))) {
LOG_WARN("failed to check and get tablet", K(ret), K(tablet_id));
} else {
time_guard.click("GetTablet");
ObTabletHandle tmp_tablet_hdl;
ObTabletHandle new_tablet_hdl;
ObTablet *tmp_tablet = nullptr;
ObTablet *old_tablet = old_tablet_handle.get_obj();
const share::ObLSID &ls_id = ls_->get_ls_id();
const ObTabletMapKey key(ls_id, tablet_id);
ObMetaDiskAddr disk_addr;
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
if (OB_FAIL(ObTabletCreateDeleteHelper::acquire_tmp_tablet(key, allocator, tmp_tablet_hdl))) {
if (OB_ENTRY_NOT_EXIST == ret) {
ret = OB_TABLET_NOT_EXIST;
} else {
LOG_WARN("failed to acquire tablet", K(ret), K(key));
}
} else if (FALSE_IT(tmp_tablet = tmp_tablet_hdl.get_obj())) {
} else if (OB_FAIL(tmp_tablet->init_with_new_snapshot_version(allocator, *old_tablet, snapshot_version))) {
LOG_WARN("failed to init tablet", K(ret), KPC(old_tablet));
} else if (FALSE_IT(time_guard.click("InitNew"))) {
} else if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tmp_tablet, new_tablet_hdl))) {
LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tmp_tablet), K(new_tablet_hdl));
} else if (FALSE_IT(disk_addr = new_tablet_hdl.get_obj()->tablet_addr_)) {
} else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) {
LOG_WARN("fail to write update tablet slog", K(ret), K(ls_id), K(tablet_id), K(disk_addr));
} else if (FALSE_IT(time_guard.click("WrSlog"))) {
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_handle, new_tablet_hdl))) {
LOG_WARN("failed to compare and swap tablet", K(ret), K(key), K(old_tablet_handle), K(new_tablet_hdl));
} else {
time_guard.click("CASwap");
}
}
return ret;
}
int ObLSTabletService::update_tablet_restore_status(
const common::ObTabletID &tablet_id,
const ObTabletRestoreStatus::STATUS &restore_status)
{
int ret = OB_SUCCESS;
ObTabletHandle tablet_handle;
ObTabletRestoreStatus::STATUS current_status = ObTabletRestoreStatus::RESTORE_STATUS_MAX;
bool can_change = false;
ObTimeGuard time_guard("ObLSTabletService::update_tablet_restore_status", 1_s);
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
time_guard.click("Lock");
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!tablet_id.is_valid())
|| OB_UNLIKELY(!ObTabletRestoreStatus::is_valid(restore_status))) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(tablet_id), K(restore_status));
} else if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle))) {
LOG_WARN("failed to get tablet", K(ret), K(tablet_id));
} else if (tablet_handle.get_obj()->is_empty_shell()) {
LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", tablet_handle.get_obj());
} else {
time_guard.click("GetTablet");
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
ObMetaDiskAddr disk_addr;
const ObTabletMapKey key(ls_->get_ls_id(), tablet_id);
ObTablet *tablet = tablet_handle.get_obj();
ObTabletHandle new_tablet_handle;
if (OB_FAIL(tablet->tablet_meta_.ha_status_.get_restore_status(current_status))) {
LOG_WARN("failed to get restore status", K(ret), KPC(tablet));
} else if (OB_FAIL(ObTabletRestoreStatus::check_can_change_status(current_status, restore_status, can_change))) {
LOG_WARN("failed to check can change status", K(ret), K(current_status), K(restore_status), KPC(tablet));
} else if (!can_change) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("can not change restore status", K(ret), K(current_status), K(restore_status), KPC(tablet));
} else if (OB_FAIL(tablet->tablet_meta_.ha_status_.set_restore_status(restore_status))) {
LOG_WARN("failed to set restore status", K(ret), K(restore_status), KPC(tablet));
} else if (restore_status == ObTabletRestoreStatus::UNDEFINED
&& OB_FALSE_IT((void)tablet->tablet_meta_.reset_transfer_table())) {
} else {
// TODO(jiahua.cjh) move check valid to tablet init after generate new version tablet.
if (OB_FAIL(tablet->check_valid())) {
LOG_WARN("failed to check tablet valid", K(ret), K(restore_status), KPC(tablet));
} else if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tablet, new_tablet_handle))) {
LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tablet), K(new_tablet_handle));
} else if (FALSE_IT(time_guard.click("Persist"))) {
} else if (FALSE_IT(disk_addr = new_tablet_handle.get_obj()->tablet_addr_)) {
} else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(key.ls_id_, tablet_id, disk_addr))) {
LOG_WARN("failed to write update tablet slog", K(ret), K(key), K(disk_addr));
} else if (FALSE_IT(time_guard.click("WrSlog"))) {
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, tablet_handle, new_tablet_handle))) {
LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(tablet_handle), K(new_tablet_handle));
ob_abort();
} else {
time_guard.click("CASwap");
LOG_INFO("succeeded to build new tablet", K(ret), K(key), K(disk_addr), K(restore_status), K(tablet_handle));
}
if (OB_FAIL(ret)) {
int tmp_ret = OB_SUCCESS;
if (OB_SUCCESS != (tmp_ret = tablet->tablet_meta_.ha_status_.set_restore_status(current_status))) {
LOG_WARN("failed to set restore status", K(tmp_ret), K(current_status), KPC(tablet));
ob_abort();
}
}
}
}
return ret;
}
int ObLSTabletService::update_tablet_ha_data_status(
const common::ObTabletID &tablet_id,
const ObTabletDataStatus::STATUS &data_status)
{
int ret = OB_SUCCESS;
ObTabletHandle tablet_handle;
ObTabletDataStatus::STATUS current_status = ObTabletDataStatus::DATA_STATUS_MAX;
bool can_change = false;
ObTimeGuard time_guard("ObLSTabletService::update_tablet_ha_data_status", 1_s);
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
time_guard.click("Lock");
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(is_stopped_)) {
ret = OB_NOT_RUNNING;
LOG_WARN("tablet service stopped", K(ret));
} else if (OB_UNLIKELY(!tablet_id.is_valid())
|| OB_UNLIKELY(!ObTabletDataStatus::is_valid(data_status))) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(tablet_id), K(data_status));
} else if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle))) {
LOG_WARN("failed to get tablet", K(ret), K(tablet_id));
} else if (tablet_handle.get_obj()->is_empty_shell()) {
LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", tablet_handle.get_obj());
} else {
time_guard.click("GetTablet");
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
ObMetaDiskAddr disk_addr;
const ObTabletMapKey key(ls_->get_ls_id(), tablet_id);
ObTablet *tablet = tablet_handle.get_obj();
ObTabletHandle new_tablet_handle;
if (OB_FAIL(tablet->tablet_meta_.ha_status_.get_data_status(current_status))) {
LOG_WARN("failed to get data status", K(ret), KPC(tablet));
} else if (OB_FAIL(ObTabletDataStatus::check_can_change_status(current_status, data_status, can_change))) {
LOG_WARN("failed to check can change status", K(ret), K(current_status), K(data_status), KPC(tablet));
} else if (!can_change) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("can not change data status", K(ret), K(current_status), K(data_status), KPC(tablet));
} else if (current_status == data_status) {
LOG_INFO("data status is same, skip update", K(tablet_id), K(current_status), K(data_status));
} else if (OB_FAIL(tablet->tablet_meta_.ha_status_.set_data_status(data_status))) {
LOG_WARN("failed to set data status", K(ret), KPC(tablet), K(data_status));
} else {
if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tablet, new_tablet_handle))) {
LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tablet), K(new_tablet_handle));
} else if (FALSE_IT(time_guard.click("Persist"))) {
} else if (FALSE_IT(disk_addr = new_tablet_handle.get_obj()->tablet_addr_)) {
} else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(key.ls_id_, tablet_id, disk_addr))) {
LOG_WARN("failed to write update tablet slog", K(ret), K(tablet_handle), K(disk_addr));
} else if (FALSE_IT(time_guard.click("WrSlog"))) {
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, tablet_handle, new_tablet_handle))) {
LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(tablet_handle), K(new_tablet_handle));
ob_usleep(1000 * 1000);
ob_abort();
} else {
time_guard.click("CASwap");
LOG_INFO("succeeded to update tablet ha data status", K(ret), K(key), K(disk_addr), K(data_status), K(tablet_handle));
}
if (OB_FAIL(ret)) {
int tmp_ret = OB_SUCCESS;
if (OB_SUCCESS != (tmp_ret = tablet->tablet_meta_.ha_status_.set_data_status(current_status))) {
LOG_WARN("failed to set data status", K(tmp_ret), K(current_status), KPC(tablet));
ob_abort();
}
}
}
}
return ret;
}
int ObLSTabletService::update_tablet_ha_expected_status(
const common::ObTabletID &tablet_id,
const ObTabletExpectedStatus::STATUS &expected_status)
{
int ret = OB_SUCCESS;
ObTabletHandle tablet_handle;
ObTabletExpectedStatus::STATUS current_status = ObTabletExpectedStatus::EXPECTED_STATUS_MAX;
bool can_change = false;
ObTimeGuard time_guard("ObLSTabletService::update_tablet_ha_data_status", 1_s);
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
time_guard.click("Lock");
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(is_stopped_)) {
ret = OB_NOT_RUNNING;
LOG_WARN("tablet service stopped", K(ret));
} else if (OB_UNLIKELY(!tablet_id.is_valid())
|| OB_UNLIKELY(!ObTabletExpectedStatus::is_valid(expected_status))) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(tablet_id), K(expected_status));
} else if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle))) {
LOG_WARN("failed to get tablet", K(ret), K(tablet_id));
} else if (tablet_handle.get_obj()->is_empty_shell()) {
LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", tablet_handle.get_obj());
} else {
time_guard.click("GetTablet");
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
ObMetaDiskAddr disk_addr;
const ObTabletMapKey key(ls_->get_ls_id(), tablet_id);
ObTablet *tablet = tablet_handle.get_obj();
ObTabletHandle new_tablet_handle;
if (OB_FAIL(tablet->tablet_meta_.ha_status_.get_expected_status(current_status))) {
LOG_WARN("failed to get data status", K(ret), KPC(tablet));
} else if (expected_status == current_status) {
LOG_INFO("tablet ha expected status is same, no need update", K(tablet_id),
K(current_status), K(expected_status));
} else if (OB_FAIL(ObTabletExpectedStatus::check_can_change_status(current_status, expected_status, can_change))) {
LOG_WARN("failed to check can change status", K(ret), K(current_status), K(expected_status), KPC(tablet));
} else if (!can_change) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("can not change meta status", K(ret), K(current_status), K(expected_status), KPC(tablet));
} else {
if (OB_FAIL(tablet->tablet_meta_.ha_status_.set_expected_status(expected_status))) {
LOG_WARN("failed to set ha meta status", K(ret), KPC(tablet), K(expected_status));
} else {
if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tablet, new_tablet_handle))) {
LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tablet), K(new_tablet_handle));
} else if (FALSE_IT(disk_addr = new_tablet_handle.get_obj()->tablet_addr_)) {
} else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(key.ls_id_, tablet_id, disk_addr))) {
LOG_WARN("failed to write update tablet slog", K(ret), K(tablet_handle), K(disk_addr));
} else if (FALSE_IT(time_guard.click("WrSlog"))) {
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, tablet_handle, new_tablet_handle))) {
LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(tablet_handle), K(new_tablet_handle));
usleep(1000 * 1000);
ob_abort();
} else {
time_guard.click("CASwap");
LOG_INFO("succeeded to update tablet meta status", K(ret), K(key), K(disk_addr), K(expected_status), KPC(tablet));
}
if (OB_FAIL(ret)) {
int tmp_ret = OB_SUCCESS;
if (OB_SUCCESS != (tmp_ret = tablet->tablet_meta_.ha_status_.set_expected_status(current_status))) {
LOG_WARN("failed to set expected status", K(tmp_ret), K(current_status), KPC(tablet));
ob_abort();
}
}
}
}
}
return ret;
}
int ObLSTabletService::replay_create_tablet(
const ObMetaDiskAddr &disk_addr,
const char *buf,
const int64_t buf_len,
const ObTabletID &tablet_id,
ObTabletTransferInfo &tablet_transfer_info)
{
int ret = OB_SUCCESS;
bool b_exist = false;
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
ObFreezer *freezer = ls_->get_freezer();
const ObLSID &ls_id = ls_->get_ls_id();
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret));
} else if (OB_FAIL(has_tablet(ls_id, tablet_id, b_exist))) {
LOG_WARN("fail to check tablet existence", K(ret), K(ls_id), K(tablet_id));
} else if (b_exist) {
ret = OB_ERR_UNEXPECTED;
LOG_ERROR("restart replay tablet should not exist", K(ret), K(ls_id), K(tablet_id));
} else {
ObTimeGuard time_guard("ObLSTabletService::replay_create_tablet", 1_s);
common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "ReplayCreate"));
const ObTabletMapKey key(ls_id, tablet_id);
ObTabletHandle tablet_hdl;
ObTablet *tablet = nullptr;
int64_t pos = 0;
ObMetaDiskAddr old_addr;
ObTabletPoolType pool_type;
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
time_guard.click("Lock");
if (OB_FAIL(ObTabletCreateDeleteHelper::create_tmp_tablet(key, allocator, tablet_hdl))) {
LOG_WARN("fail to create temporary tablet", K(ret), K(key));
} else if (FALSE_IT(tablet = tablet_hdl.get_obj())) {
} else if (FALSE_IT(tablet->tablet_addr_ = disk_addr)) {
} else if (OB_FAIL(t3m->get_tablet_addr(key, old_addr))) {
LOG_WARN("fail to get tablet addr", K(ret), K(key));
} else if (OB_FAIL(tablet->deserialize(allocator, buf, buf_len, pos))) {
LOG_WARN("fail to deserialize tablet", K(ret), K(buf), K(buf_len), K(pos));
} else if (FALSE_IT(time_guard.click("Deserialize"))) {
} else if (OB_FAIL(tablet->init_shared_params(ls_id,
tablet_id,
tablet->get_tablet_meta().max_sync_storage_schema_version_,
tablet->get_tablet_meta().max_serialized_medium_scn_,
tablet->get_tablet_meta().compat_mode_,
freezer))) {
LOG_WARN("failed to init shared params", K(ret), K(ls_id), K(tablet_id));
} else if (OB_FAIL(tablet_id_set_.set(tablet_id))) {
LOG_WARN("fail to set tablet id set", K(ret), K(tablet_id));
} else {
if (tablet->is_empty_shell()) {
pool_type = ObTabletPoolType::TP_NORMAL;
} else {
const int64_t try_cache_size = tablet->get_try_cache_size();
if (try_cache_size > ObTenantMetaMemMgr::NORMAL_TABLET_POOL_SIZE) {
pool_type = ObTabletPoolType::TP_LARGE;
} else {
pool_type = ObTabletPoolType::TP_NORMAL;
}
}
}
if (OB_FAIL(ret)) {
// do nothing
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_addr, disk_addr, pool_type, true /* whether to set tablet pool */))) {
LOG_WARN("fail to compare and swap tablat in t3m", K(ret), K(key), K(old_addr), K(disk_addr));
} else if (FALSE_IT(time_guard.click("CASwap"))) {
} else if (OB_FAIL(tablet->check_and_set_initial_state())) {
LOG_WARN("fail to check and set initial state", K(ret), K(key));
} else if (OB_FAIL(tablet->start_ddl_if_need())) {
LOG_WARN("start ddl if need failed", K(ret));
} else if (OB_FAIL(tablet->inc_macro_ref_cnt())) {
LOG_WARN("fail to increase macro blocks' ref cnt for meta and data", K(ret));
}
if (OB_SUCC(ret)) {
tablet_transfer_info = tablet->get_tablet_meta().transfer_info_;
FLOG_INFO("succeeded to replay create one tablet", K(ret), K(ls_id), K(tablet_id), KPC(tablet));
} else {
int tmp_ret = OB_SUCCESS;
if (OB_TMP_FAIL(tablet_id_set_.erase(tablet_id))) {
if (OB_HASH_NOT_EXIST != tmp_ret) {
LOG_ERROR("fail to erase tablet id from set", K(tmp_ret), K(tablet_id));
}
}
if (OB_TMP_FAIL(inner_remove_tablet(key.ls_id_, key.tablet_id_))) {
LOG_WARN("fail to erase tablet from meta memory manager", K(tmp_ret), K(key));
}
}
}
return ret;
}
int ObLSTabletService::get_tablet_with_timeout(
const common::ObTabletID &tablet_id,
ObTabletHandle &handle,
const int64_t retry_timeout_us,
const ObMDSGetTabletMode mode,
const share::SCN &snapshot)
{
int ret = OB_SUCCESS;
const ObTabletMapKey key(ls_->get_ls_id(), tablet_id);
const int64_t timeout_step_us = 10 * 1000 * 1000; // 10s
const int64_t snapshot_version = snapshot.get_val_for_tx();
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!tablet_id.is_valid()
|| mode < ObMDSGetTabletMode::READ_ALL_COMMITED)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(tablet_id), K(mode));
} else if (OB_FAIL(ObTabletCreateDeleteHelper::check_and_get_tablet(key, handle, timeout_step_us, mode, snapshot_version))) {
while (OB_ALLOCATE_MEMORY_FAILED == ret && ObClockGenerator::getClock() < retry_timeout_us) {
ret = ObTabletCreateDeleteHelper::check_and_get_tablet(key, handle, timeout_step_us, mode, snapshot_version);
}
if (OB_ALLOCATE_MEMORY_FAILED == ret) {
ret = OB_TIMEOUT;
LOG_WARN("get tablet timeout", K(ret), K(retry_timeout_us), K(ObTimeUtil::current_time()), K(mode));
}
}
return ret;
}
int ObLSTabletService::direct_get_tablet(const common::ObTabletID &tablet_id, ObTabletHandle &handle)
{
TIMEGUARD_INIT(STORAGE, 10_ms);
int ret = OB_SUCCESS;
const ObTabletMapKey key(ls_->get_ls_id(), tablet_id);
if (CLICK_FAIL(ObTabletCreateDeleteHelper::get_tablet(key, handle))) {
LOG_WARN("failed to get tablet from t3m", K(ret), K(key));
}
return ret;
}
int ObLSTabletService::inner_table_scan(
ObTabletHandle &tablet_handle,
ObTableScanIterator &iter,
ObTableScanParam &param)
{
// NOTICE: ObTableScanParam for_update_ param is ignored here,
// upper layer will handle it, so here for_update_ is always false
int ret = OB_SUCCESS;
ObStoreCtx &store_ctx = iter.get_ctx_guard().get_store_ctx();
int64_t data_max_schema_version = 0;
bool is_bounded_staleness_read = (NULL == param.trans_desc_)
? false
: param.snapshot_.is_weak_read();
if (OB_UNLIKELY(!tablet_handle.is_valid()) || OB_UNLIKELY(!param.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(tablet_handle), K(param));
} else if (is_bounded_staleness_read
&& OB_FAIL(tablet_handle.get_obj()->get_max_schema_version(data_max_schema_version))) {
LOG_WARN("failed to get max schema version", K(ret), K(param));
} else if (is_bounded_staleness_read
&& OB_FAIL(tablet_handle.get_obj()->check_schema_version_for_bounded_staleness_read(
param.schema_version_, data_max_schema_version, param.index_id_))) {
//check schema_version with ref_table_id, because schema_version of scan_param is from ref table
LOG_WARN("check schema version for bounded staleness read fail", K(ret), K(param));
//need to get store ctx of PG, cur_key_ saves the real partition
} else if (param.fb_snapshot_.is_min()) {
ret = OB_SNAPSHOT_DISCARDED;
} else {
const int64_t snapshot_version = store_ctx.mvcc_acc_ctx_.get_snapshot_version().get_val_for_tx();
const int64_t current_time = ObClockGenerator::getClock();
const int64_t timeout = param.timeout_ - current_time;
if (OB_UNLIKELY(timeout <= 0)) {
ret = OB_TIMEOUT;
LOG_WARN("table scan timeout", K(ret), K(current_time), "table_scan_param_timeout", param.timeout_, K(lbt()));
} else if (OB_FAIL(tablet_handle.get_obj()->check_snapshot_readable_with_cache(snapshot_version, timeout))) {
LOG_WARN("failed to check snapshot readable", K(ret), K(snapshot_version), K(timeout));
} else if (param.need_switch_param_) {
if (OB_FAIL(iter.switch_param(param, tablet_handle))) {
LOG_WARN("failed to init table scan iterator, ", K(ret));
}
} else if (OB_FAIL(iter.init(param, tablet_handle))) {
LOG_WARN("failed to init table scan iterator, ", K(ret));
}
}
if (OB_FAIL(ret)) {
LOG_WARN("failed to do table scan", K(ret), K(param), K(*this),
K(data_max_schema_version));
}
return ret;
}
int ObLSTabletService::has_tablet(
const share::ObLSID &ls_id,
const common::ObTabletID &tablet_id,
bool &b_exist)
{
int ret = OB_SUCCESS;
b_exist = false;
const ObTabletMapKey key(ls_id, tablet_id);
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
if (OB_FAIL(t3m->has_tablet(key, b_exist))) {
LOG_WARN("failed to check tablet exist", K(ret), K(key));
}
return ret;
}
int ObLSTabletService::create_tablet(
const share::ObLSID &ls_id,
const common::ObTabletID &tablet_id,
const common::ObTabletID &data_tablet_id,
const share::SCN &create_scn,
const int64_t snapshot_version,
const share::schema::ObTableSchema &table_schema,
const lib::Worker::CompatMode &compat_mode,
ObTabletHandle &tablet_handle)
{
int ret = OB_SUCCESS;
common::ObArenaAllocator tmp_allocator(common::ObMemAttr(MTL_ID(), "CreateTab"));
common::ObArenaAllocator *allocator = nullptr;
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
const ObTabletMapKey key(ls_id, tablet_id);
ObTablet *tablet = nullptr;
ObFreezer *freezer = ls_->get_freezer();
bool need_create_empty_major_sstable = false;
tablet_handle.reset();
if (OB_FAIL(ObTabletCreateDeleteHelper::prepare_create_msd_tablet())) {
LOG_WARN("fail to prepare create msd tablet", K(ret));
} else {
ObBucketHashWLockGuard lock_guard(bucket_lock_, key.tablet_id_.hash());
if (OB_FAIL(ObTabletCreateDeleteHelper::create_msd_tablet(key, tablet_handle))) {
LOG_WARN("failed to create msd tablet", K(ret), K(key));
} else if (OB_ISNULL(tablet = tablet_handle.get_obj())
|| OB_ISNULL(allocator = tablet_handle.get_allocator())) {
ret = OB_ERR_UNEXPECTED;
LOG_ERROR("new tablet is null", K(ret), KP(tablet), KP(allocator), K(tablet_handle));
} else if (OB_FAIL(ObTabletCreateDeleteHelper::check_need_create_empty_major_sstable(
table_schema, need_create_empty_major_sstable))) {
LOG_WARN("failed to check need create sstable", K(ret));
} else if (OB_FAIL(tablet->init_for_first_time_creation(*allocator, ls_id, tablet_id, data_tablet_id,
create_scn, snapshot_version, table_schema, compat_mode, need_create_empty_major_sstable, freezer))) {
LOG_WARN("failed to init tablet", K(ret), K(ls_id), K(tablet_id), K(data_tablet_id),
K(create_scn), K(snapshot_version), K(table_schema), K(compat_mode));
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, tablet_handle, tablet_handle))) {
LOG_WARN("failed to compare and swap tablet", K(ret), K(key), K(tablet_handle));
} else if (OB_FAIL(tablet_id_set_.set(tablet_id))) {
LOG_WARN("fail to insert tablet id", K(ret), K(ls_id), K(tablet_id));
} else {
report_tablet_to_rs(tablet_id);
}
}
return ret;
}
int ObLSTabletService::create_inner_tablet(
const share::ObLSID &ls_id,
const common::ObTabletID &tablet_id,
const common::ObTabletID &data_tablet_id,
const share::SCN &create_scn,
const int64_t snapshot_version,
const share::schema::ObTableSchema &table_schema,
const lib::Worker::CompatMode &compat_mode,
ObTabletHandle &tablet_handle)
{
int ret = OB_SUCCESS;
common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "LSCreateTab"));
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
const ObTabletMapKey key(ls_id, tablet_id);
ObTablet *tmp_tablet = nullptr;
ObFreezer *freezer = ls_->get_freezer();
bool need_create_empty_major_sstable = false;
ObTabletHandle tmp_tablet_hdl;
ObMetaDiskAddr disk_addr;
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
if (OB_FAIL(ObTabletCreateDeleteHelper::create_tmp_tablet(key, allocator, tmp_tablet_hdl))) {
LOG_WARN("failed to create temporary tablet", K(ret), K(key));
} else if (OB_ISNULL(tmp_tablet = tmp_tablet_hdl.get_obj())) {
ret = OB_ERR_UNEXPECTED;
LOG_ERROR("new tablet is null", K(ret), KPC(tmp_tablet), K(tmp_tablet_hdl));
} else if (OB_FAIL(ObTabletCreateDeleteHelper::check_need_create_empty_major_sstable(
table_schema, need_create_empty_major_sstable))) {
LOG_WARN("failed to check need create sstable", K(ret));
} else if (OB_FAIL(tmp_tablet->init_for_first_time_creation(allocator, ls_id, tablet_id, data_tablet_id,
create_scn, snapshot_version, table_schema, compat_mode, need_create_empty_major_sstable, freezer))) {
LOG_WARN("failed to init tablet", K(ret), K(ls_id), K(tablet_id), K(data_tablet_id),
K(create_scn), K(snapshot_version), K(table_schema), K(compat_mode));
int tmp_ret = OB_SUCCESS;
if (OB_TMP_FAIL(inner_remove_tablet(ls_id, tablet_id))) {
LOG_ERROR("failed to delete tablet from t3m", K(ret), K(key), K(lbt()));
ob_usleep(1000 * 1000);
ob_abort();
}
} else if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tmp_tablet, tablet_handle))) {
LOG_WARN("fail to persist and transform tablet", K(ret), K(tmp_tablet_hdl), K(tablet_handle));
} else if (FALSE_IT(disk_addr = tablet_handle.get_obj()->get_tablet_addr())) {
} else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) {
LOG_WARN("failed to write update tablet slog", K(ret), K(tablet_handle));
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, tablet_handle, tablet_handle))) {
LOG_WARN("failed to add tablet to meta mem mgr", K(ret), K(key), K(tablet_handle));
} else if (OB_FAIL(tablet_id_set_.set(tablet_id))) {
LOG_ERROR("fail to set tablet id set", K(ret), K(tablet_id), K(lbt()));
ob_usleep(1000 * 1000);
ob_abort();
} else {
LOG_INFO("create inner tablet success", K(key), K(disk_addr));
}
return ret;
}
int ObLSTabletService::create_transfer_in_tablet(
const share::ObLSID &ls_id,
const ObMigrationTabletParam &tablet_meta,
ObTabletHandle &tablet_handle)
{
int ret = OB_SUCCESS;
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
const ObTabletMapKey key(ls_id, tablet_meta.tablet_id_);
ObTablet *tablet = nullptr;
ObFreezer *freezer = ls_->get_freezer();
common::ObArenaAllocator *allocator = nullptr;
ObTabletHandle old_tablet_hdl;
LOG_INFO("prepare to init transfer in tablet", K(ret), K(ls_id), K(tablet_meta));
ObTimeGuard time_guard("CreateTransferIn", 3_s);
bool cover_empty_shell = false;
if (!is_inited_) {
ret = OB_NOT_INIT;
LOG_WARN("ls tablet service do not init", K(ret));
} else if (!ls_id.is_valid() || !tablet_meta.is_valid()) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("create transfer in tablet get invalid argument", K(ret), K(ls_id), K(tablet_meta));
} else if (OB_FAIL(direct_get_tablet(tablet_meta.tablet_id_, old_tablet_hdl))) {
if (OB_TABLET_NOT_EXIST == ret) {
ret = OB_SUCCESS;
LOG_DEBUG("tablet not exist", K(ret), K(tablet_meta.tablet_id_));
} else {
LOG_WARN("fail to get tablet", K(ret), K(tablet_meta.tablet_id_));
}
} else if (!old_tablet_hdl.get_obj()->is_empty_shell()) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("old tablet is not empty shell", K(ret), K(old_tablet_hdl));
} else if (FALSE_IT(cover_empty_shell = true)) {
// Called in mds trans callback, slog won't be written.
} else if (OB_FAIL(do_remove_tablet(key))) {
LOG_WARN("failed to remove tablet", K(ret), K(key));
}
time_guard.click("Prepare");
if (FAILEDx(ObTabletCreateDeleteHelper::prepare_create_msd_tablet())) {
LOG_WARN("failed to prepare create msd tablet", K(ret));
} else {
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_meta.tablet_id_.hash());
time_guard.click("Lock");
if (FAILEDx(ObTabletCreateDeleteHelper::create_msd_tablet(key, tablet_handle))) {
LOG_WARN("failed to create msd tablet", K(ret), K(key));
} else if (OB_ISNULL(tablet = tablet_handle.get_obj())
|| OB_ISNULL(allocator = tablet_handle.get_allocator())) {
ret = OB_ERR_UNEXPECTED;
LOG_ERROR("new tablet is null", K(ret), KP(tablet), KP(allocator), K(tablet_handle));
} else if (OB_FAIL(tablet->init_with_migrate_param(*allocator, tablet_meta, false/*is_update*/, freezer))) {
LOG_WARN("failed to init tablet", K(ret), K(ls_id), K(tablet_meta));
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, tablet_handle, tablet_handle))) {
LOG_WARN("failed to compare and swap tablet", K(ret), K(key), K(tablet_handle));
} else if (OB_FAIL(tablet_id_set_.set(tablet_meta.tablet_id_))) {
LOG_WARN("fail to insert tablet id", K(ret), K(ls_id), K(tablet_meta));
} else {
LOG_INFO("create transfer in tablet", K(ls_id), K(key), K(tablet_meta), K(cover_empty_shell));
time_guard.click("Swap");
}
}
return ret;
}
int ObLSTabletService::create_empty_shell_tablet(
const ObMigrationTabletParam &param,
ObTabletHandle &tablet_handle)
{
int ret = OB_SUCCESS;
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
const share::ObLSID &ls_id = param.ls_id_;
const common::ObTabletID &tablet_id = param.tablet_id_;
const ObTabletMapKey key(ls_id, tablet_id);
ObTabletHandle old_tablet_hdl;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("ls tablet svr hasn't been inited", K(ret));
} else if (OB_UNLIKELY(!key.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(key));
} else if (OB_FAIL(direct_get_tablet(tablet_id, old_tablet_hdl))) {
if (OB_TABLET_NOT_EXIST == ret) {
ret = OB_SUCCESS;
LOG_DEBUG("tablet not exist", K(ret), K(tablet_id));
} else {
LOG_WARN("fail to get tablet", K(ret), K(tablet_id));
}
} else if (OB_FAIL(remove_tablet(old_tablet_hdl))) {
LOG_WARN("failed to remove tablet", K(ret), K(key));
}
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); // must lock after prepare
common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "MigEmptyT"));
ObTabletHandle tmp_tablet_hdl;
if (FAILEDx(ObTabletCreateDeleteHelper::create_tmp_tablet(key, allocator, tmp_tablet_hdl))) {
LOG_WARN("fail to create temporary tablet", K(ret), K(key));
} else {
ObFreezer *freezer = ls_->get_freezer();
ObTablet *tmp_tablet = tmp_tablet_hdl.get_obj();
ObTabletHandle tablet_handle;
ObTablet *new_tablet = nullptr;
ObMetaDiskAddr disk_addr;
if (OB_FAIL(tmp_tablet->init_with_migrate_param(allocator, param, false/*is_update*/, freezer))) {
LOG_WARN("failed to init tablet", K(ret), K(param));
} else if (OB_FAIL(ObTabletPersister::transform_empty_shell(*tmp_tablet, tablet_handle))) {
LOG_WARN("failed to transform empty shell", K(ret), KPC(tmp_tablet));
} else if (FALSE_IT(new_tablet = tablet_handle.get_obj())) {
} else if (OB_FAIL(ObTabletSlogHelper::write_empty_shell_tablet_slog(new_tablet, disk_addr))) {
LOG_WARN("fail to write emtpy shell tablet slog", K(ret), K(tablet_id), K(disk_addr));
} else if (FALSE_IT(new_tablet->tablet_addr_ = disk_addr)) {
} else if (OB_FAIL(refresh_tablet_addr(ls_id, tablet_id, tablet_handle))) {
LOG_WARN("failed to refresh tablet addr", K(ret), K(ls_id), K(tablet_id), K(lbt()));
ob_usleep(1000 * 1000);
ob_abort();
} else {
ls_->get_tablet_gc_handler()->set_tablet_gc_trigger();
LOG_INFO("succeeded to create empty shell tablet", K(ret), K(key), K(param));
}
}
return ret;
}
int ObLSTabletService::rollback_tablet(
const share::ObLSID &ls_id,
const common::ObTabletID &tablet_id)
{
int ret = OB_SUCCESS;
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
ObLSHandle ls_handle;
ObLS *ls = nullptr;
ObTabletMapKey key(ls_id, tablet_id);
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("ls tablet service do not init", K(ret));
} else if (OB_UNLIKELY(!ls_id.is_valid() || !tablet_id.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("rollback tablet get invalid argument", K(ret), K(ls_id), K(tablet_id));
} else if (OB_FAIL(do_remove_tablet(key))) {
LOG_WARN("failed to delete tablet", K(ret), K(key));
} else if (OB_FAIL(tablet_id_set_.erase(key.tablet_id_))) {
if (OB_HASH_NOT_EXIST == ret) {
ret = OB_SUCCESS;
LOG_DEBUG("tablet id does not exist, maybe has not been inserted yet", K(ret), K(key));
} else {
//the caller checks abort if is required.
LOG_WARN("failed to erase tablet id", K(ret), K(key));
}
}
return ret;
}
int ObLSTabletService::create_memtable(
const common::ObTabletID &tablet_id,
const int64_t schema_version,
const bool for_replay,
const share::SCN clog_checkpoint_scn)
{
int ret = OB_SUCCESS;
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
ObTabletHandle old_tablet_handle;
const ObTabletMapKey key(ls_->get_ls_id(), tablet_id);
ObTabletHandle new_tablet_handle;
ObTabletMemberWrapper<ObTabletTableStore> table_store;
ObTabletMemberWrapper<share::ObTabletAutoincSeq> autoinc_seq;
ObTimeGuard time_guard("ObLSTabletService::create_memtable", 10_ms);
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!tablet_id.is_valid() || schema_version < 0)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(tablet_id), K(schema_version));
} else {
// we need bucket lock here to protect multi version tablet creation
// during tablet creating new memtable and put it into table store.
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
time_guard.click("Lock");
if (OB_FAIL(direct_get_tablet(tablet_id, old_tablet_handle))) {
LOG_WARN("fail to get tablet", K(ret), K(tablet_id));
} else if (old_tablet_handle.get_obj()->is_empty_shell()) {
LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", old_tablet_handle.get_obj());
} else {
time_guard.click("get tablet");
ObTablet &old_tablet = *(old_tablet_handle.get_obj());
if (OB_FAIL(old_tablet.create_memtable(schema_version, clog_checkpoint_scn, for_replay))) {
if (OB_MINOR_FREEZE_NOT_ALLOW != ret) {
LOG_WARN("fail to create memtable", K(ret), K(new_tablet_handle), K(schema_version), K(tablet_id));
}
} else if (FALSE_IT(time_guard.click("create memtable"))) {
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_handle, old_tablet_handle))) {
LOG_WARN("fail to compare and swap tablet", K(ret), K(key), K(old_tablet_handle));
}
}
}
return ret;
}
int ObLSTabletService::check_allow_to_read(AllowToReadMgr::AllowToReadInfo &read_info)
{
int ret = OB_SUCCESS;
allow_to_read_mgr_.load_allow_to_read_info(read_info);
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (!read_info.allow_to_read()) {
ret = OB_REPLICA_NOT_READABLE;
LOG_WARN("ls is not allow to read", K(ret), KPC(ls_));
}
return ret;
}
int ObLSTabletService::check_read_info_same(const AllowToReadMgr::AllowToReadInfo &read_info)
{
int ret = OB_SUCCESS;
bool is_same = false;
allow_to_read_mgr_.check_read_info_same(read_info, is_same);
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (!is_same) {
ret = OB_REPLICA_NOT_READABLE;
LOG_WARN("ls is not allow to read", K(ret), KPC(ls_));
}
return ret;
}
int ObLSTabletService::get_read_tables(
const common::ObTabletID &tablet_id,
const int64_t snapshot_version,
ObTabletTableIterator &iter,
const bool allow_no_ready_read)
{
int ret = OB_SUCCESS;
ObTabletHandle &handle = iter.tablet_handle_;
iter.reset();
AllowToReadMgr::AllowToReadInfo read_info;
ObTabletMapKey key;
key.tablet_id_ = tablet_id;
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!tablet_id.is_valid() || snapshot_version < 0)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid arguments", K(ret), K(tablet_id), K(snapshot_version));
} else if (FALSE_IT(allow_to_read_mgr_.load_allow_to_read_info(read_info))) {
} else if (!read_info.allow_to_read()) {
ret = OB_REPLICA_NOT_READABLE;
LOG_WARN("ls is not allow to read", K(ret), KPC(ls_));
} else if (FALSE_IT(key.ls_id_ = ls_->get_ls_id())) {
} else if (OB_FAIL(ObTabletCreateDeleteHelper::check_and_get_tablet(key, handle,
ObTabletCommon::DEFAULT_GET_TABLET_DURATION_US,
ObMDSGetTabletMode::READ_READABLE_COMMITED,
snapshot_version))) {
if (OB_TABLET_NOT_EXIST != ret) {
LOG_WARN("fail to check and get tablet", K(ret), K(key), K(snapshot_version));
}
} else if (OB_UNLIKELY(!handle.is_valid())) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("unexpected error, invalid tablet handle", K(ret), K(handle));
} else if (OB_FAIL(handle.get_obj()->get_read_tables(snapshot_version, iter,
allow_no_ready_read))) {
LOG_WARN("fail to get read tables", K(ret), K(handle), K(tablet_id), K(snapshot_version),
K(iter), K(allow_no_ready_read));
} else {
bool is_same = false;
allow_to_read_mgr_.check_read_info_same(read_info, is_same);
if (!is_same) {
ret = OB_REPLICA_NOT_READABLE;
LOG_WARN("ls is not allow to read", K(ret), KPC(ls_));
}
}
return ret;
}
int ObLSTabletService::set_tablet_status(
const common::ObTabletID &tablet_id,
const ObTabletCreateDeleteMdsUserData &tablet_status,
mds::MdsCtx &ctx)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!tablet_id.is_valid() || !tablet_status.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid arguments", K(ret), K(tablet_id), K(tablet_status));
} else {
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
ObTabletHandle tablet_handle;
if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle))) {
if (OB_TABLET_NOT_EXIST == ret) {
ret = OB_EAGAIN;
LOG_WARN("this tablet has been deleted, skip it", K(ret), K(tablet_id));
} else {
LOG_WARN("fail to get tablet", K(ret));
}
} else if (OB_FAIL(tablet_handle.get_obj()->set_tablet_status(tablet_status, ctx))) {
LOG_WARN("fail to set tablet status", K(ret), K(tablet_id), K(tablet_status));
} else {
LOG_INFO("succeeded to set tablet status", K(ret), K(tablet_id), K(tablet_status));
}
}
return ret;
}
int ObLSTabletService::replay_set_tablet_status(
const common::ObTabletID &tablet_id,
const share::SCN &scn,
const ObTabletCreateDeleteMdsUserData &tablet_status,
mds::MdsCtx &ctx)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!tablet_id.is_valid() || !tablet_status.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid arguments", K(ret), K(tablet_id), K(tablet_status));
} else {
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
ObTabletHandle tablet_handle;
if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle))) {
if (OB_TABLET_NOT_EXIST == ret) {
ret = OB_EAGAIN;
LOG_WARN("this tablet has been deleted, skip it", K(ret), K(tablet_id));
} else {
LOG_WARN("fail to get tablet", K(ret));
}
} else if (OB_FAIL(tablet_handle.get_obj()->replay_set_tablet_status(scn, tablet_status, ctx))) {
LOG_WARN("fail to replay set tablet status", K(ret), K(tablet_id), K(scn), K(tablet_status));
} else {
LOG_INFO("succeeded to replay set tablet status", K(ret), K(tablet_id), K(scn), K(tablet_status));
}
}
return ret;
}
int ObLSTabletService::set_ddl_info(
const common::ObTabletID &tablet_id,
const ObTabletBindingMdsUserData &ddl_data,
mds::MdsCtx &ctx,
const int64_t timeout_us)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!tablet_id.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid arguments", K(ret), K(tablet_id), K(ddl_data));
} else {
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
ObTabletHandle tablet_handle;
if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle))) {
if (OB_TABLET_NOT_EXIST == ret) {
ret = OB_EAGAIN;
LOG_WARN("this tablet has been deleted, skip it", K(ret), K(tablet_id));
} else {
LOG_WARN("fail to get tablet", K(ret));
}
} else if (OB_FAIL(tablet_handle.get_obj()->set_ddl_info(ddl_data, ctx, timeout_us))) {
LOG_WARN("fail to set ddl info", K(ret), K(tablet_id), K(ddl_data), K(timeout_us));
} else {
LOG_INFO("succeeded to set ddl info", K(ret), K(tablet_id), K(ddl_data), K(timeout_us));
}
}
return ret;
}
int ObLSTabletService::replay_set_ddl_info(
const common::ObTabletID &tablet_id,
const share::SCN &scn,
const ObTabletBindingMdsUserData &ddl_data,
mds::MdsCtx &ctx)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!tablet_id.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid arguments", K(ret), K(tablet_id), K(ddl_data));
} else {
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
ObTabletHandle tablet_handle;
if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle))) {
if (OB_TABLET_NOT_EXIST == ret) {
ret = OB_EAGAIN;
LOG_WARN("this tablet has been deleted, skip it", K(ret), K(tablet_id));
} else {
LOG_WARN("fail to get tablet", K(ret));
}
} else if (OB_FAIL(tablet_handle.get_obj()->replay_set_ddl_info(scn, ddl_data, ctx))) {
LOG_WARN("fail to set ddl info", K(ret), K(tablet_id), K(ddl_data), K(scn));
} else {
LOG_INFO("succeeded to set ddl info", K(ret), K(tablet_id), K(ddl_data), K(scn));
}
}
return ret;
}
int ObLSTabletService::build_create_sstable_param_for_migration(
const blocksstable::ObMigrationSSTableParam &mig_param,
ObTabletCreateSSTableParam &param)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(!mig_param.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid argument", K(ret), K(mig_param));
} else {
param.table_key_ = mig_param.table_key_;
param.schema_version_ = mig_param.basic_meta_.schema_version_;
param.create_snapshot_version_ = mig_param.basic_meta_.create_snapshot_version_;
param.progressive_merge_round_ = mig_param.basic_meta_.progressive_merge_round_;
param.progressive_merge_step_ = mig_param.basic_meta_.progressive_merge_step_;
param.is_ready_for_read_ = false;
param.table_mode_ = mig_param.basic_meta_.table_mode_;
param.index_type_ = static_cast<share::schema::ObIndexType>(mig_param.basic_meta_.index_type_);
param.rowkey_column_cnt_ = mig_param.basic_meta_.rowkey_column_count_;
param.root_row_store_type_ = mig_param.basic_meta_.root_row_store_type_;
param.latest_row_store_type_ = mig_param.basic_meta_.latest_row_store_type_;
param.index_blocks_cnt_ = mig_param.basic_meta_.index_macro_block_count_;
param.data_blocks_cnt_ = mig_param.basic_meta_.data_macro_block_count_;
param.micro_block_cnt_ = mig_param.basic_meta_.data_micro_block_count_;
param.use_old_macro_block_count_ = mig_param.basic_meta_.use_old_macro_block_count_;
param.row_count_ = mig_param.basic_meta_.row_count_;
param.column_cnt_ = mig_param.basic_meta_.column_cnt_;
param.data_checksum_ = mig_param.basic_meta_.data_checksum_;
param.occupy_size_ = mig_param.basic_meta_.occupy_size_;
param.original_size_ = mig_param.basic_meta_.original_size_;
param.max_merged_trans_version_ = mig_param.basic_meta_.max_merged_trans_version_;
param.ddl_scn_ = mig_param.basic_meta_.ddl_scn_;
param.filled_tx_scn_ = mig_param.basic_meta_.filled_tx_scn_;
param.contain_uncommitted_row_ = mig_param.basic_meta_.contain_uncommitted_row_;
param.compressor_type_ = mig_param.basic_meta_.compressor_type_;
param.encrypt_id_ = mig_param.basic_meta_.encrypt_id_;
param.master_key_id_ = mig_param.basic_meta_.master_key_id_;
MEMCPY(param.encrypt_key_, mig_param.basic_meta_.encrypt_key_, share::OB_MAX_TABLESPACE_ENCRYPT_KEY_LENGTH);
param.root_block_addr_.set_none_addr();
param.data_block_macro_meta_addr_.set_none_addr();;
if (OB_FAIL(param.column_checksums_.assign(mig_param.column_checksums_))) {
LOG_WARN("fail to assign column checksums", K(ret), K(mig_param));
}
}
return ret;
}
int ObLSTabletService::insert_rows(
ObTabletHandle &tablet_handle,
ObStoreCtx &ctx,
const ObDMLBaseParam &dml_param,
const common::ObIArray<uint64_t> &column_ids,
common::ObNewRowIterator *row_iter,
int64_t &affected_rows)
{
int ret = OB_SUCCESS;
NG_TRACE(S_insert_rows_begin);
int64_t afct_num = 0;
int64_t dup_num = 0;
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!ctx.is_valid())
|| !ctx.is_write()
|| OB_UNLIKELY(!dml_param.is_valid())
|| OB_UNLIKELY(column_ids.count() <= 0)
|| OB_ISNULL(row_iter)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(ctx), K(dml_param), K(column_ids), KP(row_iter));
} else if (dml_param.is_direct_insert()) { // direct-insert mode
const ObTableSchemaParam::Columns &columns = dml_param.table_param_->get_data_table().get_columns();
bool is_heap_table = columns.at(0)->is_hidden();
if (OB_FAIL(direct_insert_rows(dml_param.table_param_->get_data_table().get_table_id(),
dml_param.direct_insert_task_id_,
ctx.tablet_id_,
is_heap_table,
row_iter,
afct_num))) {
LOG_WARN("failed to insert rows direct", KR(ret),
K(dml_param.table_param_->get_data_table().get_table_id()),
K(dml_param.direct_insert_task_id_),
K(ctx.tablet_id_),
K(is_heap_table));
}
} else {
ObArenaAllocator lob_allocator(ObModIds::OB_LOB_ACCESS_BUFFER, OB_MALLOC_NORMAL_BLOCK_SIZE, MTL_ID());
ObDMLRunningCtx run_ctx(ctx,
dml_param,
ctx.mvcc_acc_ctx_.mem_ctx_->get_query_allocator(),
lob_allocator,
ObDmlFlag::DF_INSERT);
ObIAllocator &work_allocator = run_ctx.allocator_;
void *ptr = nullptr;
ObStoreRow *tbl_rows = nullptr;
int64_t row_count = 0;
bool first_bulk = true;
ObNewRow *rows = nullptr;
if (OB_FAIL(prepare_dml_running_ctx(&column_ids, nullptr, tablet_handle, run_ctx))) {
LOG_WARN("failed to prepare dml running ctx", K(ret));
} else {
ObTabletHandle tmp_handle;
SMART_VAR(ObRowsInfo, rows_info) {
const ObRelativeTable &data_table = run_ctx.relative_table_;
while (OB_SUCC(ret) && OB_SUCC(get_next_rows(row_iter, rows, row_count))) {
ObStoreRow reserved_row;
// Let ObStorageTableGuard refresh retired memtable, should not hold origin tablet handle
// outside the while loop.
if (tmp_handle.get_obj() != run_ctx.relative_table_.tablet_iter_.get_tablet_handle().get_obj()) {
tmp_handle = run_ctx.relative_table_.tablet_iter_.get_tablet_handle();
rows_info.reset();
if (OB_FAIL(rows_info.init(data_table, ctx, tmp_handle.get_obj()->get_rowkey_read_info()))) {
LOG_WARN("Failed to init rows info", K(ret), K(data_table));
}
}
if (OB_FAIL(ret)) {
} else if (row_count <= 0) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("row_count should be greater than 0", K(ret));
} else if (1 == row_count) {
tbl_rows = &reserved_row;
tbl_rows[0].flag_.set_flag(ObDmlFlag::DF_INSERT);
} else if (first_bulk) {
first_bulk = false;
if (OB_ISNULL(ptr = work_allocator.alloc(row_count * sizeof(ObStoreRow)))) {
ret = OB_ALLOCATE_MEMORY_FAILED;
LOG_ERROR("fail to allocate memory", K(ret), K(row_count));
} else {
tbl_rows = new (ptr) ObStoreRow[row_count];
for (int64_t i = 0; i < row_count; i++) {
tbl_rows[i].flag_.set_flag(ObDmlFlag::DF_INSERT);
}
}
}
if (OB_FAIL(ret)) {
} else if (OB_ISNULL(tbl_rows)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("unexpected error, tbl_rows is NULL", K(ret), KP(tbl_rows));
} else if (OB_FAIL(insert_rows_to_tablet(tablet_handle, run_ctx, rows,
row_count, rows_info, tbl_rows, afct_num, dup_num))) {
LOG_WARN("insert to each tablets fail", K(ret));
}
}
} else {
LOG_WARN("Failed to allocate ObRowsInfo", K(ret));
}
lob_allocator.reuse();
}
if (OB_ITER_END == ret) {
ret = OB_SUCCESS;
}
if (nullptr != ptr) {
work_allocator.free(ptr);
}
lob_allocator.reset();
}
if (OB_SUCC(ret)) {
LOG_DEBUG("succeeded to insert rows", K(ret));
affected_rows = afct_num;
EVENT_ADD(STORAGE_INSERT_ROW_COUNT, afct_num);
}
NG_TRACE(S_insert_rows_end);
return ret;
}
int ObLSTabletService::direct_insert_rows(
const uint64_t table_id,
const int64_t task_id,
const ObTabletID &tablet_id,
const bool is_heap_table,
ObNewRowIterator *row_iter,
int64_t &affected_rows)
{
int ret = OB_SUCCESS;
ObTableLoadTableCtx *table_ctx = nullptr;
ObTableLoadKey key(MTL_ID(), table_id);
if (OB_FAIL(ObTableLoadService::get_ctx(key, table_ctx))) {
LOG_WARN("fail to get table ctx", KR(ret), K(key));
} else {
int64_t row_count = 0;
ObNewRow *rows = nullptr;
table::ObTableLoadTransId trans_id;
trans_id.segment_id_ = task_id;
trans_id.trans_gid_ = 1;
ObTableLoadStore store(table_ctx);
if (OB_FAIL(store.init())) {
LOG_WARN("fail to init store", KR(ret));
}
while (OB_SUCC(ret) && OB_SUCC(get_next_rows(row_iter, rows, row_count))) {
if (row_count <= 0) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("row_count should be greater than 0", K(ret));
} else {
common::ObArray<ObNewRow> row_array;
for (int64_t i = 0; OB_SUCC(ret) && (i < row_count); ++i) {
ObNewRow new_row;
if (is_heap_table) {
new_row.assign(rows[i].cells_ + 1, rows[i].count_ - 1);
} else {
new_row.assign(rows[i].cells_, rows[i].count_);
}
if (OB_FAIL(row_array.push_back(new_row))) {
LOG_WARN("failed to push back row to row_array", KR(ret), K(i), K(new_row));
}
}
if (OB_SUCC(ret)) {
if (OB_FAIL(store.px_write(trans_id, tablet_id, row_array))) {
LOG_WARN("failed to write to store", KR(ret), K(trans_id),
K(table_id), K(tablet_id), K(row_array));
} else {
affected_rows += row_count;
}
}
}
}
if (OB_ITER_END == ret) {
ret = OB_SUCCESS;
}
}
if (OB_NOT_NULL(table_ctx)) {
ObTableLoadService::put_ctx(table_ctx);
table_ctx = nullptr;
}
return ret;
}
int ObLSTabletService::insert_row(
ObTabletHandle &tablet_handle,
ObStoreCtx &ctx,
const ObDMLBaseParam &dml_param,
const common::ObIArray<uint64_t> &column_ids,
const common::ObIArray<uint64_t> &duplicated_column_ids,
const common::ObNewRow &row,
const ObInsertFlag flag,
int64_t &affected_rows,
common::ObNewRowIterator *&duplicated_rows)
{
int ret = OB_SUCCESS;
const ObTabletID &data_tablet_id = ctx.tablet_id_;
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!ctx.is_valid()
|| !ctx.is_write()
|| !dml_param.is_valid()
|| column_ids.count() <= 0
|| duplicated_column_ids.count() <= 0
|| !row.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(ctx), K(dml_param),
K(column_ids), K(duplicated_column_ids), K(row), K(flag));
} else {
ObArenaAllocator lob_allocator(ObModIds::OB_LOB_ACCESS_BUFFER, OB_MALLOC_NORMAL_BLOCK_SIZE, MTL_ID());
ObDMLRunningCtx run_ctx(ctx,
dml_param,
ctx.mvcc_acc_ctx_.mem_ctx_->get_query_allocator(),
lob_allocator,
ObDmlFlag::DF_INSERT);
ObIAllocator &work_allocator = run_ctx.allocator_;
duplicated_rows = nullptr;
ObStoreRow &tbl_row = run_ctx.tbl_row_;
const ObRelativeTable &data_table = run_ctx.relative_table_;
if (OB_FAIL(prepare_dml_running_ctx(&column_ids, nullptr, tablet_handle, run_ctx))) {
LOG_WARN("failed to prepare dml running ctx", K(ret));
} else {
tbl_row.flag_.set_flag(ObDmlFlag::DF_INSERT);
tbl_row.row_val_ = row;
if (OB_FAIL(get_conflict_rows(tablet_handle,
run_ctx,
flag,
duplicated_column_ids,
tbl_row.row_val_,
duplicated_rows))) {
LOG_WARN("failed to get conflict row(s)", K(ret), K(duplicated_column_ids), K(row));
} else if (nullptr == duplicated_rows) {
if (OB_FAIL(insert_row_to_tablet(tablet_handle, run_ctx, tbl_row))) {
if (OB_TRY_LOCK_ROW_CONFLICT != ret) {
LOG_WARN("failed to write row", K(ret));
}
} else {
LOG_DEBUG("succeeded to insert row", K(ret), K(row));
affected_rows = 1;
EVENT_INC(STORAGE_INSERT_ROW_COUNT);
}
} else {
ret = OB_ERR_PRIMARY_KEY_DUPLICATE;
}
}
lob_allocator.reset();
}
return ret;
}
static inline
bool is_lob_update(ObDMLRunningCtx &run_ctx, const ObIArray<int64_t> &update_idx)
{
bool bool_ret = false;
for (int64_t i = 0; i < update_idx.count() && !bool_ret; ++i) {
int64_t idx = update_idx.at(i);
if (run_ctx.col_descs_->at(idx).col_type_.is_lob_storage()) {
bool_ret = true;
}
}
return bool_ret;
}
int ObLSTabletService::update_rows(
ObTabletHandle &tablet_handle,
ObStoreCtx &ctx,
const ObDMLBaseParam &dml_param,
const ObIArray<uint64_t> &column_ids,
const ObIArray< uint64_t> &updated_column_ids,
ObNewRowIterator *row_iter,
int64_t &affected_rows)
{
int ret = OB_SUCCESS;
NG_TRACE(S_update_rows_begin);
const ObTabletID &data_tablet_id = ctx.tablet_id_;
int64_t afct_num = 0;
int64_t dup_num = 0;
int64_t got_row_count = 0;
ObTimeGuard timeguard(__func__, 3 * 1000 * 1000);
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!ctx.is_valid()
|| !ctx.is_write()
|| !dml_param.is_valid()
|| column_ids.count() <= 0
|| updated_column_ids.count() <= 0
|| nullptr == row_iter)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(ctx), K(dml_param),
K(column_ids), K(updated_column_ids), KP(row_iter));
} else {
timeguard.click("Get");
ObArenaAllocator lob_allocator(ObModIds::OB_LOB_ACCESS_BUFFER, OB_MALLOC_NORMAL_BLOCK_SIZE, MTL_ID());
ObDMLRunningCtx run_ctx(ctx,
dml_param,
ctx.mvcc_acc_ctx_.mem_ctx_->get_query_allocator(),
lob_allocator,
ObDmlFlag::DF_UPDATE);
ObIAllocator &work_allocator = run_ctx.allocator_;
ObStoreRow old_tbl_row;
void *old_row_cells = nullptr;
ObStoreRow &new_tbl_row = run_ctx.tbl_row_;
bool rowkey_change = false;
UpdateIndexArray update_idx;
ObRowStore row_store;
bool delay_new = false;
bool lob_update = false;
const ObRelativeTable &relative_table = run_ctx.relative_table_;
if (OB_FAIL(prepare_dml_running_ctx(&column_ids, &updated_column_ids, tablet_handle, run_ctx))) {
LOG_WARN("failed to prepare dml running ctx", K(ret));
} else if (FALSE_IT(tablet_handle.reset())) {
} else if (FALSE_IT(timeguard.click("Prepare"))) {
} else if (OB_UNLIKELY(!relative_table.is_valid())) {
ret = OB_ERR_SYS;
LOG_ERROR("data table is not prepared", K(ret));
} else if (OB_FAIL(construct_update_idx(relative_table.get_rowkey_column_num(),
run_ctx.col_map_,
updated_column_ids, update_idx))) {
LOG_WARN("failed to construct update_idx", K(ret), K(updated_column_ids));
} else if (FALSE_IT(timeguard.click("Construct"))) {
} else if (OB_FAIL(check_rowkey_change(updated_column_ids, relative_table, rowkey_change, delay_new))) {
LOG_WARN("failed to check rowkey changes", K(ret));
} else {
timeguard.click("Check");
const int64_t num = relative_table.get_column_count();
if (OB_ISNULL(old_row_cells = work_allocator.alloc(
static_cast<int64_t>(sizeof(common::ObObj) * num)))) {
ret = OB_ALLOCATE_MEMORY_FAILED;
LOG_ERROR("failed to malloc temp row cells", K(ret));
} else {
timeguard.click("AllocOld");
old_tbl_row.row_val_.cells_ = new (old_row_cells) ObObj[num]();
old_tbl_row.flag_.set_flag(ObDmlFlag::DF_UPDATE);
new_tbl_row.flag_.set_flag(ObDmlFlag::DF_UPDATE);
}
lob_update = is_lob_update(run_ctx, update_idx);
}
int64_t cur_time = 0;
ObTabletHandle tmp_handle;
while (OB_SUCC(ret)
&& OB_SUCC(get_next_row_from_iter(row_iter, old_tbl_row, true))
&& OB_SUCC(get_next_row_from_iter(row_iter, new_tbl_row, false))) {
LOG_DEBUG("get_dml_update_row", KP(row_iter), K(old_tbl_row), K(new_tbl_row));
// Let ObStorageTableGuard refresh retired memtable, should not hold origin tablet handle
// outside the while loop.
if (tmp_handle.get_obj() != run_ctx.relative_table_.tablet_iter_.get_tablet_handle().get_obj()) {
tmp_handle = run_ctx.relative_table_.tablet_iter_.get_tablet_handle();
}
bool duplicate = false;
++got_row_count;
cur_time = ObClockGenerator::getClock();
if ((0 == (0x1FF & got_row_count)) && (cur_time > dml_param.timeout_)) {
//checking timeout cost too much, so check every 512 rows
ret = OB_TIMEOUT;
LOG_WARN("query timeout", K(cur_time), K(dml_param), K(ret));
} else if (OB_FAIL(update_row_to_tablet(tmp_handle,
run_ctx,
rowkey_change,
update_idx,
delay_new,
lob_update,
old_tbl_row,
new_tbl_row,
&row_store,
duplicate))) {
LOG_WARN("failed to update row to tablets", K(ret), K(old_tbl_row), K(new_tbl_row));
} else if (duplicate) {
dup_num++;
} else {
afct_num++;
}
lob_allocator.reuse();
timeguard.click("Update");
}
if (OB_ITER_END == ret) {
ret = OB_SUCCESS;
}
if (OB_SUCC(ret) && row_store.get_row_count() > 0) {
void *ptr1 = nullptr;
const int64_t num = relative_table.get_column_count();
if (OB_ISNULL(ptr1 = work_allocator.alloc(sizeof(common::ObObj) * num))) {
ret = OB_ALLOCATE_MEMORY_FAILED;
LOG_ERROR("failed to malloc temp row cells", K(ret));
} else {
timeguard.click("AllocNew");
new_tbl_row.row_val_.cells_ = new(ptr1) ObObj[num]();
ObRowStore::Iterator row_iter2 = row_store.begin();
ObTabletHandle tmp_handle;
// when total_quantity_log is true, we should iterate new_tbl_row and old_tbl_row, and
// dispose these two rows together, otherwise, when total_quantity_log is false,
// row_iter2 doesn't contain old rows, and old_tbl_row is a dummy param in process_new_row
while (OB_SUCC(ret) && OB_SUCC(row_iter2.get_next_row(new_tbl_row.row_val_))) {
// Let ObStorageTableGuard refresh retired memtable, should not hold origin tablet handle
// outside the while loop.
if (tmp_handle.get_obj() != run_ctx.relative_table_.tablet_iter_.get_tablet_handle().get_obj()) {
tmp_handle = run_ctx.relative_table_.tablet_iter_.get_tablet_handle();
}
int64_t data_tbl_rowkey_len = relative_table.get_rowkey_column_num();
bool tbl_rowkey_change = false;
if (OB_FAIL(row_iter2.get_next_row(old_tbl_row.row_val_))) {
LOG_WARN("fail to get row from row stores", K(ret));
} else if (FALSE_IT(timeguard.click("GetNext"))) {
} else if (rowkey_change && OB_FAIL(check_rowkey_value_change(old_tbl_row.row_val_,
new_tbl_row.row_val_,
data_tbl_rowkey_len,
tbl_rowkey_change))) {
LOG_WARN("check data table rowkey change failed", K(ret), K(old_tbl_row),
K(new_tbl_row), K(data_tbl_rowkey_len));
} else if (OB_FAIL(process_new_row(tmp_handle,
run_ctx,
update_idx,
old_tbl_row,
new_tbl_row,
tbl_rowkey_change))) {
LOG_WARN("fail to process new row", K(ret), K(old_tbl_row), K(new_tbl_row));
}
timeguard.click("Process");
}
work_allocator.free(ptr1);
ptr1 = nullptr;
new_tbl_row.row_val_.cells_ = nullptr;
}
}
if (OB_ITER_END == ret) {
ret = OB_SUCCESS;
}
if (nullptr != old_row_cells) {
work_allocator.free(old_row_cells);
}
lob_allocator.reset();
old_tbl_row.row_val_.cells_ = nullptr;
if (OB_SUCC(ret)) {
affected_rows = afct_num;
EVENT_ADD(STORAGE_UPDATE_ROW_COUNT, afct_num);
}
if (timeguard.get_diff() > 3 * 1000 * 1000) {
LOG_WARN_RET(OB_ERR_TOO_MUCH_TIME, "update rows use too much time", K(afct_num), K(got_row_count));
}
}
NG_TRACE(S_update_rows_end);
return ret;
}
int ObLSTabletService::put_rows(
ObTabletHandle &tablet_handle,
ObStoreCtx &ctx,
const ObDMLBaseParam &dml_param,
const ObIArray<uint64_t> &column_ids,
ObNewRowIterator *row_iter,
int64_t &affected_rows)
{
int ret = OB_SUCCESS;
const ObTabletID &data_tablet_id = ctx.tablet_id_;
int64_t afct_num = 0;
ObTimeGuard timeguard(__func__, 3 * 1000 * 1000);
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!ctx.is_valid())
|| OB_UNLIKELY(!ctx.is_write())
|| OB_UNLIKELY(!dml_param.is_valid())
|| OB_UNLIKELY(column_ids.count() <= 0)
|| OB_ISNULL(row_iter)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(ctx), K(dml_param), K(column_ids), KP(row_iter));
} else {
ObArenaAllocator lob_allocator(ObModIds::OB_LOB_ACCESS_BUFFER, OB_MALLOC_NORMAL_BLOCK_SIZE, MTL_ID());
ObDMLRunningCtx run_ctx(ctx,
dml_param,
ctx.mvcc_acc_ctx_.mem_ctx_->get_query_allocator(),
lob_allocator,
ObDmlFlag::DF_UPDATE);
ObIAllocator &work_allocator = run_ctx.allocator_;
ObNewRow *row = nullptr;
ObStoreRow &tbl_row = run_ctx.tbl_row_;
const ObRelativeTable &data_table = run_ctx.relative_table_;
if (OB_FAIL(prepare_dml_running_ctx(&column_ids, nullptr, tablet_handle, run_ctx))) {
LOG_WARN("failed to prepare dml running ctx", K(ret));
} else {
tablet_handle.reset();
tbl_row.flag_.set_flag(ObDmlFlag::DF_UPDATE);
}
int64_t cur_time = 0;
ObTabletHandle tmp_handle;
while (OB_SUCC(ret) && OB_SUCC(row_iter->get_next_row(row))) {
// Let ObStorageTableGuard refresh retired memtable, should not hold origin tablet handle
// outside the while loop.
if (tmp_handle.get_obj() != run_ctx.relative_table_.tablet_iter_.get_tablet_handle().get_obj()) {
tmp_handle = run_ctx.relative_table_.tablet_iter_.get_tablet_handle();
}
cur_time = ObClockGenerator::getClock();
tbl_row.row_val_ = *row;
if (cur_time > dml_param.timeout_) {
ret = OB_TIMEOUT;
LOG_WARN("query timeout", K(ret), K(cur_time), K(dml_param));
} else if (OB_FAIL(insert_row_to_tablet(tmp_handle, run_ctx, tbl_row))) {
if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) {
LOG_WARN("failed to write row", K(ret));
}
}
++afct_num;
lob_allocator.reuse();
}
if (OB_ITER_END == ret) {
ret = OB_SUCCESS;
}
lob_allocator.reset();
if (OB_SUCC(ret)) {
affected_rows = afct_num;
EVENT_ADD(STORAGE_INSERT_ROW_COUNT, afct_num);
}
}
return ret;
}
int ObLSTabletService::delete_rows(
ObTabletHandle &tablet_handle,
ObStoreCtx &ctx,
const ObDMLBaseParam &dml_param,
const ObIArray<uint64_t> &column_ids,
ObNewRowIterator *row_iter,
int64_t &affected_rows)
{
int ret = OB_SUCCESS;
NG_TRACE(S_delete_rows_begin);
const ObTabletID &data_tablet_id = ctx.tablet_id_;
ObRowReshape *row_reshape = nullptr;
int64_t afct_num = 0;
ObTimeGuard timeguard(__func__, 3 * 1000 * 1000);
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_ISNULL(row_iter) || !ctx.is_valid() || !ctx.is_write()
|| column_ids.count() <= 0 || OB_ISNULL(row_iter)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(dml_param), K(column_ids),
KP(row_iter), K(ctx));
} else {
ObArenaAllocator lob_allocator(ObModIds::OB_LOB_ACCESS_BUFFER, OB_MALLOC_NORMAL_BLOCK_SIZE, MTL_ID());
ObDMLRunningCtx run_ctx(ctx,
dml_param,
ctx.mvcc_acc_ctx_.mem_ctx_->get_query_allocator(),
lob_allocator,
ObDmlFlag::DF_DELETE);
ObNewRow *row = nullptr;
if (OB_FAIL(prepare_dml_running_ctx(&column_ids, nullptr, tablet_handle, run_ctx))) {
LOG_WARN("failed to prepare dml running ctx", K(ret));
} else {
tablet_handle.reset();
}
// delete table rows
int64_t cur_time = 0;
ObTabletHandle tmp_handle;
while (OB_SUCC(ret) && OB_SUCC(row_iter->get_next_row(row))) {
// Let ObStorageTableGuard refresh retired memtable, should not hold origin tablet handle
// outside the while loop.
if (tmp_handle.get_obj() != run_ctx.relative_table_.tablet_iter_.get_tablet_handle().get_obj()) {
tmp_handle = run_ctx.relative_table_.tablet_iter_.get_tablet_handle();
}
cur_time = ObClockGenerator::getClock();
if (cur_time > run_ctx.dml_param_.timeout_) {
ret = OB_TIMEOUT;
LOG_WARN("query timeout", K(cur_time), K(run_ctx.dml_param_), K(ret));
} else if (OB_ISNULL(row)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("get next row from iterator failed", KP(row), K(ret));
} else if (OB_FAIL(delete_row_in_tablet(tmp_handle, run_ctx, *row))) {
LOG_WARN("fail to delete row", K(ret), K(row));
} else {
++afct_num;
}
lob_allocator.reuse();
}
lob_allocator.reset();
if (OB_ITER_END == ret) {
ret = OB_SUCCESS;
}
if (OB_SUCC(ret)) {
affected_rows = afct_num;
EVENT_ADD(STORAGE_DELETE_ROW_COUNT, afct_num);
}
}
NG_TRACE(S_delete_rows_end);
return ret;
}
int ObLSTabletService::lock_rows(
ObTabletHandle &tablet_handle,
ObStoreCtx &ctx,
const ObDMLBaseParam &dml_param,
const int64_t abs_lock_timeout,
const ObLockFlag lock_flag,
const bool is_sfu,
ObNewRowIterator *row_iter,
int64_t &affected_rows)
{
UNUSEDx(lock_flag, is_sfu);
NG_TRACE(S_lock_rows_begin);
int ret = OB_SUCCESS;
const ObTabletID &data_tablet_id = ctx.tablet_id_;
ObTimeGuard timeguard(__func__, 3 * 1000 * 1000);
int64_t afct_num = 0;
ObColDescArray col_desc;
common::ObSEArray<uint64_t, 1> column_ids;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("tablet service is not initialized", K(ret));
} else if (OB_UNLIKELY(!ctx.is_valid()
|| !ctx.is_write()
|| !dml_param.is_valid()
|| OB_ISNULL(row_iter))) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid argument", K(ret), K(ctx), K(dml_param), KPC(row_iter));
} else {
timeguard.click("Get");
ObDMLRunningCtx run_ctx(ctx,
dml_param,
ctx.mvcc_acc_ctx_.mem_ctx_->get_query_allocator(),
ctx.mvcc_acc_ctx_.mem_ctx_->get_query_allocator(),
ObDmlFlag::DF_LOCK);
ObNewRow *row = nullptr;
if (OB_FAIL(prepare_dml_running_ctx(nullptr, nullptr, tablet_handle, run_ctx))) {
LOG_WARN("failed to prepare dml running ctx", K(ret));
} else if (FALSE_IT(tablet_handle.reset())) {
} else if (FALSE_IT(timeguard.click("Prepare"))) {
} else if (OB_FAIL(run_ctx.relative_table_.get_rowkey_column_ids(col_desc))) {
LOG_WARN("Fail to get column desc", K(ret));
} else if (OB_FAIL(run_ctx.relative_table_.get_rowkey_column_ids(column_ids))) {
LOG_WARN("Fail to get column ids", K(ret));
} else {
timeguard.click("GetIds");
run_ctx.column_ids_ = &column_ids;
ctx.mvcc_acc_ctx_.abs_lock_timeout_ =
ObTablet::get_lock_wait_timeout(abs_lock_timeout, dml_param.timeout_);
ObTabletHandle tmp_handle;
while (OB_SUCCESS == ret && OB_SUCC(row_iter->get_next_row(row))) {
// Let ObStorageTableGuard refresh retired memtable, should not hold origin tablet handle
// outside the while loop.
if (tmp_handle.get_obj() != run_ctx.relative_table_.tablet_iter_.get_tablet_handle().get_obj()) {
tmp_handle = run_ctx.relative_table_.tablet_iter_.get_tablet_handle();
}
ObRelativeTable &relative_table = run_ctx.relative_table_;
bool is_exists = true;
if (ObTimeUtility::current_time() > dml_param.timeout_) {
ret = OB_TIMEOUT;
int64_t cur_time = ObClockGenerator::getClock();
LOG_WARN("query timeout", K(cur_time), K(dml_param), K(ret));
} else if (GCONF.enable_defensive_check()
&& OB_FAIL(check_old_row_legitimacy(tmp_handle, run_ctx, *row))) {
LOG_WARN("check row legitimacy failed", K(ret), KPC(row));
} else if (GCONF.enable_defensive_check()
&& OB_FAIL(check_new_row_nullable_value(col_desc, relative_table, *row))) {
LOG_WARN("check lock row nullable failed", K(ret));
} else if (FALSE_IT(timeguard.click("Check"))) {
} else if (OB_FAIL(tmp_handle.get_obj()->lock_row(run_ctx.relative_table_, ctx, *row))) {
if (OB_TRY_LOCK_ROW_CONFLICT != ret) {
LOG_WARN("failed to lock row", K(*row), K(ret));
}
} else {
++afct_num;
}
timeguard.click("Lock");
}
if (OB_ITER_END == ret) {
ret = OB_SUCCESS;
affected_rows = afct_num;
}
}
}
NG_TRACE(S_lock_rows_end);
return ret;
}
int ObLSTabletService::lock_row(
ObTabletHandle &tablet_handle,
ObStoreCtx &ctx,
const ObDMLBaseParam &dml_param,
const int64_t abs_lock_timeout,
const ObNewRow &row,
const ObLockFlag lock_flag,
const bool is_sfu)
{
UNUSEDx(lock_flag, is_sfu);
int ret = OB_SUCCESS;
const ObTabletID &data_tablet_id = ctx.tablet_id_;
ObTimeGuard timeguard(__func__, 3 * 1000 * 1000);
int64_t afct_num = 0;
ObColDescArray col_desc;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("tablet service is not initialized", K(ret));
} else if (OB_UNLIKELY(!ctx.is_valid() || !dml_param.is_valid() || !row.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid argument", K(ret), K(ctx), K(dml_param), K(row));
} else {
ObDMLRunningCtx run_ctx(ctx,
dml_param,
ctx.mvcc_acc_ctx_.mem_ctx_->get_query_allocator(),
ctx.mvcc_acc_ctx_.mem_ctx_->get_query_allocator(),
ObDmlFlag::DF_LOCK);
if (OB_FAIL(prepare_dml_running_ctx(nullptr, nullptr, tablet_handle, run_ctx))) {
LOG_WARN("failed to prepare dml running ctx", K(ret));
} else if (OB_FAIL(run_ctx.relative_table_.get_rowkey_column_ids(col_desc))) {
LOG_WARN("Fail to get column desc", K(ret));
} else {
ctx.mvcc_acc_ctx_.abs_lock_timeout_ =
ObTablet::get_lock_wait_timeout(abs_lock_timeout, dml_param.timeout_);
if (ObTimeUtility::current_time() > dml_param.timeout_) {
ret = OB_TIMEOUT;
int64_t cur_time = ObClockGenerator::getClock();
LOG_WARN("query timeout", K(cur_time), K(dml_param), K(ret));
} else if (OB_FAIL(tablet_handle.get_obj()->lock_row(run_ctx.relative_table_, ctx, row))) {
if (OB_TRY_LOCK_ROW_CONFLICT != ret) {
LOG_WARN("failed to lock row", K(row), K(ret));
}
} else {
++afct_num;
}
}
}
return ret;
}
int ObLSTabletService::trim_rebuild_tablet(
const ObTabletID &tablet_id,
const bool is_rollback)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(is_stopped_)) {
ret = OB_NOT_RUNNING;
LOG_WARN("tablet service stopped", K(ret));
} else if (OB_UNLIKELY(!tablet_id.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid argument", K(ret), K(tablet_id));
} else if (is_rollback && OB_FAIL(rollback_rebuild_tablet(tablet_id))) {
LOG_WARN("failed to rollback tablet rebuilt", K(ret), K(is_rollback), K(tablet_id));
} else if (!is_rollback && OB_FAIL(trim_old_tablets(tablet_id))) {
LOG_WARN("failed to trim old tablets", K(ret), K(is_rollback), K(tablet_id));
}
return ret;
}
int ObLSTabletService::create_or_update_migration_tablet(
const ObMigrationTabletParam &mig_tablet_param,
const bool is_transfer)
{
// TODO: is_transfer may be redundant, temporarily unused
UNUSEDx(is_transfer);
int ret = OB_SUCCESS;
const share::ObLSID &ls_id = mig_tablet_param.ls_id_;
const common::ObTabletID &tablet_id = mig_tablet_param.tablet_id_;
ObTabletHandle tablet_handle;
bool b_exist = false;
const bool need_create_msd_tablet = mig_tablet_param.is_empty_shell();
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(is_stopped_)) {
ret = OB_NOT_RUNNING;
LOG_WARN("tablet service stopped", K(ret));
} else if (!mig_tablet_param.is_empty_shell()
&& (OB_UNLIKELY(!mig_tablet_param.is_valid())
|| OB_UNLIKELY(ls_id != ls_->get_ls_id()))) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(mig_tablet_param), K_(ls));
} else if (need_create_msd_tablet) {
if (OB_FAIL(create_empty_shell_tablet(mig_tablet_param, tablet_handle))) {
LOG_WARN("failed to create empty shell tablet", K(ret), K(tablet_id), K(mig_tablet_param));
}
} else {
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
if (OB_FAIL(has_tablet(ls_id, tablet_id, b_exist))) {
LOG_WARN("failed to check tablet existence", K(ls_id), K(tablet_id));
} else if (b_exist
&& OB_FAIL(migrate_update_tablet(mig_tablet_param))) {
LOG_WARN("failed to update tablet meta", K(ret), K(tablet_id), K(mig_tablet_param));
} else if (!b_exist
&& OB_FAIL(migrate_create_tablet(mig_tablet_param, tablet_handle))) {
LOG_WARN("failed to migrate create tablet", K(ret), K(mig_tablet_param));
}
}
return ret;
}
int ObLSTabletService::rebuild_create_tablet(
const ObMigrationTabletParam &mig_tablet_param,
const bool keep_old)
{
int ret = OB_SUCCESS;
const share::ObLSID &ls_id = mig_tablet_param.ls_id_;
const common::ObTabletID &tablet_id = mig_tablet_param.tablet_id_;
const ObTabletMapKey key(ls_id, tablet_id);
bool b_exist = false;
const bool need_create_msd_tablet = mig_tablet_param.is_empty_shell() && !keep_old;
ObTabletHandle new_tablet_handle;
ObTabletHandle old_tablet_handle;
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(is_stopped_)) {
ret = OB_NOT_RUNNING;
LOG_WARN("tablet service stopped", K(ret));
} else if (OB_UNLIKELY(!mig_tablet_param.is_valid())
|| OB_UNLIKELY(ls_id != ls_->get_ls_id())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(mig_tablet_param), K_(ls));
} else if (OB_UNLIKELY(mig_tablet_param.is_empty_shell() && keep_old)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("unexpected error, rebuild create an empty shell tablet, but still need the old tablet", K(ret),
K(mig_tablet_param), K(keep_old));
} else if (need_create_msd_tablet) {
if (OB_FAIL(create_empty_shell_tablet(mig_tablet_param, new_tablet_handle))) {
LOG_WARN("failed to create empty shell tablet", K(ret), K(tablet_id), K(mig_tablet_param));
}
} else {
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
if (OB_FAIL(has_tablet(ls_id, tablet_id, b_exist))) {
LOG_WARN("fail to check tablet existence", K(ls_id), K(tablet_id));
} else if (!b_exist &&
OB_FAIL(migrate_create_tablet(mig_tablet_param, new_tablet_handle))) {
LOG_WARN("failed to rebuild create tablet", K(ret), K(tablet_id), K(mig_tablet_param));
} else if (b_exist && !keep_old &&
OB_FAIL(migrate_update_tablet(mig_tablet_param))) {
LOG_WARN("failed to rebuild create tablet", K(ret), K(tablet_id), K(mig_tablet_param));
} else if (b_exist && keep_old) {
if (OB_FAIL(ObTabletCreateDeleteHelper::check_and_get_tablet(key, old_tablet_handle,
ObTabletCommon::DEFAULT_GET_TABLET_DURATION_US,
ObMDSGetTabletMode::READ_WITHOUT_CHECK,
ObTransVersion::MAX_TRANS_VERSION))) {
LOG_WARN("failed to check and get tablet", K(ret), K(key));
} else if (OB_UNLIKELY(old_tablet_handle.get_obj()->get_tablet_meta().has_next_tablet_)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("number of nodes on list exceeds 2", K(ret));
} else if (OB_FAIL(rebuild_tablet_with_old(mig_tablet_param, old_tablet_handle))) {
LOG_WARN("failed to rebuild tablet and maintain linked list", K(ret), K(tablet_id));
}
}
}
return ret;
}
int ObLSTabletService::build_ha_tablet_new_table_store(
const ObTabletID &tablet_id,
const ObBatchUpdateTableStoreParam &param)
{
int ret = OB_SUCCESS;
ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "BuildHaTab"));
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
ObMetaDiskAddr disk_addr;
ObTimeGuard time_guard("ObLSTabletService::build_ha_tablet_new_table_store", 1_s);
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(is_stopped_)) {
ret = OB_NOT_RUNNING;
LOG_WARN("tablet service stopped", K(ret));
} else if (OB_UNLIKELY(!tablet_id.is_valid() || !param.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(tablet_id), K(param));
} else {
ObTabletHandle old_tablet_handle;
ObTabletHandle tmp_tablet_handle;
ObTabletHandle new_tablet_handle;
ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash());
time_guard.click("Lock");
if (OB_FAIL(direct_get_tablet(tablet_id, old_tablet_handle))) {
LOG_WARN("failed to get tablet", K(ret), K(tablet_id));
} else if (old_tablet_handle.get_obj()->is_empty_shell()) {
LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", old_tablet_handle.get_obj());
} else {
time_guard.click("GetTablet");
ObTablet *old_tablet = old_tablet_handle.get_obj();
ObTablet *tmp_tablet = nullptr;
const share::ObLSID &ls_id = ls_->get_ls_id();
const ObTabletMapKey key(ls_id, tablet_id);
if (OB_FAIL(ObTabletCreateDeleteHelper::acquire_tmp_tablet(key, allocator, tmp_tablet_handle))) {
LOG_WARN("failed to acquire tablet", K(ret), K(key));
} else if (FALSE_IT(tmp_tablet = tmp_tablet_handle.get_obj())) {
} else if (OB_FAIL(tmp_tablet->init_for_sstable_replace(allocator, param, *old_tablet))) {
LOG_WARN("failed to init tablet", K(ret), KPC(old_tablet));
} else if (FALSE_IT(time_guard.click("InitTablet"))) {
} else if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tmp_tablet, new_tablet_handle))) {
LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tmp_tablet), K(new_tablet_handle));
} else if (FALSE_IT(time_guard.click("Persist"))) {
} else if (FALSE_IT(disk_addr = new_tablet_handle.get_obj()->tablet_addr_)) {
} else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) {
LOG_WARN("fail to write update tablet slog", K(ret), K(ls_id), K(tablet_id), K(disk_addr));
} else if (FALSE_IT(time_guard.click("WrSlog"))) {
} else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_handle, new_tablet_handle))) {
LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(disk_addr));
ob_usleep(1000 * 1000);
ob_abort();
} else {
time_guard.click("CASwap");
LOG_INFO("succeed to build ha tablet new table store", K(ret), K(key), K(disk_addr), K(param));
}
}
}
return ret;
}
int ObLSTabletService::need_check_old_row_legitimacy(ObDMLRunningCtx &run_ctx,
bool &need_check,
bool &is_udf)
{
int ret = OB_SUCCESS;
ObRelativeTable &data_table = run_ctx.relative_table_;
need_check = false;
const ObDMLBaseParam &dml_param = run_ctx.dml_param_;
is_udf = false;
// TODO(jingxing): setting this to true
if (OB_FAIL(data_table.has_udf_column(need_check))) {
LOG_WARN("check has udf column failed", K(ret));
} else if (need_check) {
is_udf = true;
ObTableStoreIterator &table_iter = *data_table.tablet_iter_.table_iter();
while (OB_SUCC(ret) && !need_check) {
ObITable *table_ptr = nullptr;
if (OB_FAIL(table_iter.get_next(table_ptr))) {
if (OB_ITER_END != ret) {
LOG_WARN("get next table failed", K(ret));
}
} else if (OB_ISNULL(table_ptr)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("error unexpected, table ptr must not be nullptr", K(ret));
} else {
need_check = table_ptr->is_major_sstable();
}
}
} else if (dml_param.is_batch_stmt_ && !data_table.is_index_table()) {
//batch stmt execution dependency defensive check to check
//if the same row was modified multiple times
need_check = true;
ret = OB_E(EventTable::EN_INS_MULTI_VALUES_BATCH_OPT) OB_SUCCESS;
// no need to check old row, just for bmsql performance optimization
// TODO yuchen.ywc
if (OB_SUCCESS != ret) {
LOG_INFO("error sim when current statement is batch update", K(ret), K(is_udf));
need_check = false;
ret = OB_SUCCESS;
}
} else if (GCONF.enable_defensive_check()) {
need_check = true;
if (data_table.is_index_table() && !data_table.can_read_index()) {
//index can not be read during building index, so does not check old index row
need_check = false;
}
if (ObDmlFlag::DF_LOCK == run_ctx.dml_flag_) {
need_check = false;
}
}
return ret;
}
int ObLSTabletService::construct_table_rows(
const ObNewRow *rows,
ObStoreRow *tbl_rows,
int64_t row_count)
{
int ret = OB_SUCCESS;
if (row_count <= 0) {
ret = OB_ERR_WRONG_VALUE_COUNT_ON_ROW;
LOG_WARN("row count should be bigger than 0", K(row_count), K(ret));
} else {
for (int64_t i = 0; i < row_count; i++) {
tbl_rows[i].row_val_ = rows[i];
}
}
return ret;
}
int ObLSTabletService::check_old_row_legitimacy(
ObTabletHandle &data_tablet_handle,
ObDMLRunningCtx &run_ctx,
const common::ObNewRow &old_row)
{
int ret = OB_SUCCESS;
ObRelativeTable &data_table = run_ctx.relative_table_;
ObStoreRowkey rowkey;
bool need_check = false;
bool is_udf = false;
rowkey.assign(old_row.cells_, data_table.get_rowkey_column_num());
if (OB_UNLIKELY(rowkey.get_obj_cnt() > old_row.count_) || OB_ISNULL(run_ctx.column_ids_)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("old row is invalid", K(ret), K(old_row), K(rowkey.get_obj_cnt()), KP(run_ctx.column_ids_));
} else if (OB_FAIL(need_check_old_row_legitimacy(run_ctx, need_check, is_udf))) {
LOG_WARN("identify need check old row legitimacy", K(ret));
} else if (need_check) {
//the vertical partition is no longer maintained,
//and the defense check skips the vertical partition function
const ObDMLBaseParam &dml_param = run_ctx.dml_param_;
ObArenaAllocator scan_allocator(common::ObMemAttr(MTL_ID(), ObModIds::OB_TABLE_SCAN_ITER));
ObIAllocator *allocator = &scan_allocator;
ObSingleRowGetter old_row_getter(*allocator, *data_tablet_handle.get_obj());
ObNewRow *storage_old_row = nullptr;
//check old row whether different with SQL.old_row,
ObDatumRowkey datum_rowkey;
ObDatumRowkeyHelper rowkey_helper;
const ObIArray<uint64_t> &column_ids = *run_ctx.column_ids_;
uint64_t err_col_id = OB_INVALID_ID;
if (OB_FAIL(rowkey_helper.convert_datum_rowkey(rowkey.get_rowkey(), datum_rowkey))) {
STORAGE_LOG(WARN, "Failed to transfer datum rowkey", K(ret), K(rowkey));
} else if (OB_FAIL(init_single_row_getter(old_row_getter, run_ctx, column_ids, data_table, true))) {
LOG_WARN("failed to init single row getter", K(ret));
} else if (OB_FAIL(old_row_getter.open(datum_rowkey, true))) {
LOG_WARN("open old row getter failed", K(ret), K(rowkey));
} else if (OB_FAIL(old_row_getter.get_next_row(storage_old_row))) {
if (OB_ITER_END == ret) {
ret = OB_ERR_DEFENSIVE_CHECK;
FLOG_WARN("old row in storage is not exists", K(ret));
} else {
LOG_WARN("get next row from old_row_iter failed", K(ret), KPC(run_ctx.column_ids_), K(old_row));
}
} else if (OB_ISNULL(storage_old_row)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("unexpected error, storage old row is NULL", K(ret));
} else if (storage_old_row->get_count() != old_row.get_count()) {
ret = OB_ERR_DEFENSIVE_CHECK;
FLOG_WARN("storage old row is not matched with sql old row", K(ret));
} else {
for (int64_t i = 0; OB_SUCC(ret) && i < old_row.get_count(); ++i) {
const ObObj &storage_val = storage_old_row->get_cell(i);
const ObObj &sql_val = old_row.get_cell(i);
int cmp = 0;
if (sql_val.is_lob_storage()) {
// skip all text and lob
} else if (OB_UNLIKELY(ObLongTextType == storage_val.get_type() && sql_val.is_lob_locator())) {
//skip check lob column type when do the normal sql write check
} else if (OB_UNLIKELY(storage_val.is_nop_value())) {
bool is_nop = false;
if (OB_FAIL(data_table.is_nop_default_value(column_ids.at(i), is_nop))) {
LOG_WARN("check column whether has nop default value failed", K(ret), K(column_ids.at(i)));
} else if (!is_nop) {
err_col_id = column_ids.at(i);
ret = OB_ERR_DEFENSIVE_CHECK;
FLOG_WARN("storage old row is not matched with sql old row", K(ret),
K(i), K(column_ids.at(i)), K(storage_val), K(sql_val));
}
} else if (sql_val.is_nop_value()) {
//this column is nop val, means that this column does not be touched by DML
//just ignore it
} else if (OB_FAIL(storage_val.compare(sql_val, cmp)) || 0 != cmp) {
ret = OB_ERR_DEFENSIVE_CHECK;
err_col_id = column_ids.at(i);
FLOG_WARN("storage_val is not equal with sql_val, maybe catch a bug", K(ret),
K(storage_val), K(sql_val), K(cmp), K(column_ids.at(i)));
}
}
}
if (OB_ERR_DEFENSIVE_CHECK == ret && dml_param.is_batch_stmt_) {
// 批量删除的时候可能索引表的删除在主表前边,所以所有的表在batch删除的时候出现4377,都可能是重复删导致的
ret = OB_BATCHED_MULTI_STMT_ROLLBACK;
LOG_TRACE("batch stmt execution has a correctness error, needs rollback", K(ret),
"column_id", column_ids,
KPC(storage_old_row),
"sql_old_row", old_row,
"dml_param", run_ctx.dml_param_,
"dml_type", run_ctx.dml_flag_);
}
if (OB_ERR_DEFENSIVE_CHECK == ret) {
int tmp_ret = OB_SUCCESS;
bool is_virtual_gen_col = false;
if (OB_TMP_FAIL(check_real_leader_for_4377_(run_ctx.store_ctx_.ls_id_))) {
ret = tmp_ret;
LOG_WARN("check real leader for 4377 found exception", K(ret), K(old_row), K(data_table));
} else if (nullptr != run_ctx.store_ctx_.mvcc_acc_ctx_.tx_desc_
&& OB_TMP_FAIL(check_need_rollback_in_transfer_for_4377_(run_ctx.store_ctx_.mvcc_acc_ctx_.tx_desc_,
data_tablet_handle))) {
ret = tmp_ret;
LOG_WARN("check need rollback in transfer for 4377 found exception", K(ret), K(old_row), K(data_table));
} else if (OB_TMP_FAIL(check_parts_tx_state_in_transfer_for_4377_(run_ctx.store_ctx_.mvcc_acc_ctx_.tx_desc_))) {
ret = tmp_ret;
LOG_WARN("check need rollback in transfer for 4377 found exception", K(ret), K(old_row), K(data_table));
} else if (is_udf) {
ret = OB_ERR_INDEX_KEY_NOT_FOUND;
LOG_WARN("index key not found on udf column", K(ret), K(old_row));
} else if (data_table.is_index_table() && OB_TMP_FAIL(check_is_gencol_check_failed(data_table, err_col_id, is_virtual_gen_col))) {
//don't change ret if gencol check failed
LOG_WARN("check is functional index failed", K(ret), K(tmp_ret), K(data_table));
} else if (is_virtual_gen_col) {
ret = OB_ERR_GENCOL_LEGIT_CHECK_FAILED;
LOG_WARN("Legitimacy check failed for functional index.", K(ret), K(old_row), KPC(storage_old_row));
}
if (OB_ERR_DEFENSIVE_CHECK == ret) {
ObString func_name = ObString::make_string("check_old_row_legitimacy");
LOG_USER_ERROR(OB_ERR_DEFENSIVE_CHECK, func_name.length(), func_name.ptr());
LOG_DBA_ERROR(OB_ERR_DEFENSIVE_CHECK, "msg", "Fatal Error!!! Catch a defensive error!", K(ret),
"column_id", column_ids,
KPC(storage_old_row),
"sql_old_row", old_row,
"dml_param", run_ctx.dml_param_,
"dml_flag", run_ctx.dml_flag_,
"store_ctx", run_ctx.store_ctx_,
"relative_table", run_ctx.relative_table_);
LOG_ERROR("Dump data table info", K(ret), K(data_table));
run_ctx.store_ctx_.force_print_trace_log();
}
}
}
return ret;
}
int ObLSTabletService::check_is_gencol_check_failed(const ObRelativeTable &data_table, uint64_t error_col_id, bool &is_virtual_gen_col)
{
int ret = OB_SUCCESS;
is_virtual_gen_col = false;
if (data_table.is_index_table()) {
const ObColumnParam *param = nullptr;
const uint64_t tenant_id = MTL_ID();
uint64_t index_table_id = data_table.get_table_id();
const ObTableSchema *index_table_schema = NULL;
const ObTableSchema *data_table_schema = NULL;
ObMultiVersionSchemaService *schema_service = MTL(ObTenantSchemaService*)->get_schema_service();
ObSchemaGetterGuard schema_guard;
if (OB_ISNULL(schema_service)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("unexpected null", K(ret), KP(schema_service));
} else if (OB_FAIL(schema_service->get_tenant_schema_guard(tenant_id, schema_guard))) {
LOG_WARN("failed to get schema manager", K(ret), K(tenant_id));
} else if (OB_FAIL(schema_guard.get_table_schema(tenant_id, index_table_id, index_table_schema))) {
LOG_WARN("get index table schema failed", K(ret));
} else if (OB_ISNULL(index_table_schema)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("index table schema is unexpected null", K(ret));
} else if (OB_FAIL(schema_guard.get_table_schema(tenant_id, index_table_schema->get_data_table_id(), data_table_schema))) {
LOG_WARN("get data table schema failed", K(ret));
} else if (OB_ISNULL(data_table_schema)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("data table schema is unexpected null", K(ret));
} else if (OB_INVALID_ID != error_col_id) {
//check specified column
const ObColumnSchemaV2 *column = NULL;
if (is_shadow_column(error_col_id)) {
//shadow column does not exists in basic table, do nothing
} else if (OB_ISNULL(column = data_table_schema->get_column_schema(error_col_id))) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("unexpected null", K(ret), KP(column));
} else if (column->is_virtual_generated_column()) {
is_virtual_gen_col = true;
}
} else {
//check all columns
for (ObTableSchema::const_column_iterator iter = index_table_schema->column_begin();
OB_SUCC(ret) && iter != index_table_schema->column_end() && !is_virtual_gen_col; iter++) {
const ObColumnSchemaV2 *column = *iter;
//the column id in the data table is the same with that in the index table
if (OB_ISNULL(column)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("unexpected null", K(ret), KP(column));
} else if (is_shadow_column(column->get_column_id())) {
//shadow column does not exists in basic table, do nothing
} else if (OB_ISNULL(column = data_table_schema->get_column_schema(column->get_column_id()))) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("unexpected null", K(ret), KP(column));
} else if (column->is_virtual_generated_column()) {
is_virtual_gen_col = true;
}
}
}
}
return ret;
}
int ObLSTabletService::check_new_row_legitimacy(
ObDMLRunningCtx &run_ctx,
const common::ObNewRow &new_row)
{
int ret = OB_SUCCESS;
ObRelativeTable &data_table = run_ctx.relative_table_;
int64_t data_table_cnt = data_table.get_column_count();
if (OB_ISNULL(run_ctx.column_ids_)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("column ids is nullptr", K(ret));
} else if (OB_FAIL(check_new_row_nullable_value(*run_ctx.column_ids_, data_table, new_row))) {
LOG_WARN("check new row nullable value failed", K(ret),
"dml_param", run_ctx.dml_param_,
"dml_type", run_ctx.dml_flag_);
} else if (OB_FAIL(check_new_row_shadow_pk(*run_ctx.column_ids_, data_table, new_row))) {
LOG_WARN("check new row nullable value failed", K(ret),
"dml_param", run_ctx.dml_param_,
"dml_type", run_ctx.dml_flag_);
}
return ret;
}
int ObLSTabletService::insert_rows_to_tablet(
ObTabletHandle &tablet_handle,
ObDMLRunningCtx &run_ctx,
const ObNewRow * const rows,
const int64_t row_count,
ObRowsInfo &rows_info,
ObStoreRow *tbl_rows,
int64_t &afct_num,
int64_t &dup_num)
{
int ret = OB_SUCCESS;
ObStoreCtx &ctx = run_ctx.store_ctx_;
const ObDMLBaseParam &dml_param = run_ctx.dml_param_;
ObRelativeTable &data_table = run_ctx.relative_table_;
if (OB_FAIL(ret)) {
} else if (ObClockGenerator::getClock() > dml_param.timeout_) {
ret = OB_TIMEOUT;
int64_t cur_time = ObClockGenerator::getClock();
LOG_WARN("query timeout", K(cur_time), K(dml_param), K(ret));
} else if (OB_FAIL(construct_table_rows(rows, tbl_rows, row_count))) {
LOG_WARN("fail to construct table rows", K(ret));
} else if (OB_FAIL(rows_info.check_duplicate(tbl_rows, row_count, data_table))) {
if (OB_ERR_PRIMARY_KEY_DUPLICATE == ret) {
char rowkey_buffer[OB_TMP_BUF_SIZE_256];
if (OB_SUCCESS != extract_rowkey(data_table,
rows_info.get_duplicate_rowkey(),
rowkey_buffer,
OB_TMP_BUF_SIZE_256,
run_ctx.dml_param_.tz_info_)) {
LOG_WARN("extract rowkey failed");
} else {
ObString index_name = "PRIMARY";
if (data_table.is_index_table()) {
data_table.get_index_name(index_name);
}
LOG_USER_ERROR(OB_ERR_PRIMARY_KEY_DUPLICATE,
rowkey_buffer, index_name.length(), index_name.ptr());
}
} else {
LOG_WARN("fail to check duplicate", K(ret));
}
} else if (OB_FAIL(insert_lob_tablet_rows(tablet_handle, run_ctx, tbl_rows, row_count))) {
LOG_WARN("failed to insert rows to lob tablet", K(ret));
} else if (OB_FAIL(insert_tablet_rows(row_count, tablet_handle, run_ctx, tbl_rows, rows_info))) {
LOG_WARN("failed to insert rows to data tablet", K(ret));
} else {
afct_num = afct_num + row_count;
}
return ret;
}
int ObLSTabletService::insert_tablet_rows(
const int64_t row_count,
ObTabletHandle &tablet_handle,
ObDMLRunningCtx &run_ctx,
ObStoreRow *rows,
ObRowsInfo &rows_info)
{
int ret = OB_SUCCESS;
ObRelativeTable &table = run_ctx.relative_table_;
const bool check_exists = !table.is_storage_index_table() || table.is_unique_index();
bool exists = false;
// 1. Defensive checking of new rows.
if (GCONF.enable_defensive_check()) {
for (int64_t i = 0; OB_SUCC(ret) && i < row_count; i++) {
ObStoreRow &tbl_row = rows[i];
if (OB_FAIL(check_new_row_legitimacy(run_ctx, tbl_row.row_val_))) {
LOG_WARN("Failed to check new row legitimacy", K(ret), K_(tbl_row.row_val));
}
}
}
// 2. Check uniqueness constraint in memetable only(active + frozen).
// It would be more efficient and elegant to completely merge the uniqueness constraint
// and write conflict checking, but the implementation currently is to minimize intrusion
// into the memtable.
if (check_exists && OB_FAIL(tablet_handle.get_obj()->rowkeys_exists(run_ctx.store_ctx_, table,
rows_info, exists))) {
LOG_WARN("Failed to check the uniqueness constraint", K(ret), K(rows_info));
} else if (exists) {
ret = OB_ERR_PRIMARY_KEY_DUPLICATE;
blocksstable::ObDatumRowkey &duplicate_rowkey = rows_info.get_conflict_rowkey();
LOG_WARN("Rowkey already exist", K(ret), K(table), K(duplicate_rowkey));
}
// 3. Insert rows with uniqueness constraint and write conflict checking.
// Check write conflict in memtable + sstable.
// Check uniqueness constraint in sstable only.
if (OB_SUCC(ret)) {
if (OB_FAIL(tablet_handle.get_obj()->insert_rows(table, run_ctx.store_ctx_, rows, rows_info,
check_exists, *run_ctx.col_descs_, row_count, run_ctx.dml_param_.encrypt_meta_))) {
if (OB_ERR_PRIMARY_KEY_DUPLICATE == ret) {
blocksstable::ObDatumRowkey &duplicate_rowkey = rows_info.get_conflict_rowkey();
LOG_WARN("Rowkey already exist", K(ret), K(table), K(duplicate_rowkey),
K(rows_info.get_conflict_idx()));
} else if (OB_TRY_LOCK_ROW_CONFLICT != ret) {
LOG_WARN("Failed to insert rows to tablet", K(ret), K(rows_info));
}
}
}
// 4. Log user error message if rowkey is duplicate.
if (OB_ERR_PRIMARY_KEY_DUPLICATE == ret && !run_ctx.dml_param_.is_ignore_) {
int tmp_ret = OB_SUCCESS;
char rowkey_buffer[OB_TMP_BUF_SIZE_256];
ObString index_name = "PRIMARY";
if (OB_TMP_FAIL(extract_rowkey(table, rows_info.get_conflict_rowkey(),
rowkey_buffer, OB_TMP_BUF_SIZE_256, run_ctx.dml_param_.tz_info_))) {
LOG_WARN("Failed to extract rowkey", K(ret), K(tmp_ret));
}
if (table.is_index_table()) {
if (OB_TMP_FAIL(table.get_index_name(index_name))) {
LOG_WARN("Failed to get index name", K(ret), K(tmp_ret));
}
} else if (lib::is_oracle_mode() && OB_TMP_FAIL(table.get_primary_key_name(index_name))) {
LOG_WARN("Failed to get pk name", K(ret), K(tmp_ret));
}
LOG_USER_ERROR(OB_ERR_PRIMARY_KEY_DUPLICATE, rowkey_buffer, index_name.length(), index_name.ptr());
}
return ret;
}
int ObLSTabletService::insert_lob_col(
ObDMLRunningCtx &run_ctx,
const ObColDesc &column,
ObObj &obj,
ObLobAccessParam *del_param,
ObLobCommon *lob_common)
{
int ret = OB_SUCCESS;
uint64_t lob_id;
ObLobManager *lob_mngr = MTL(ObLobManager*);
if (OB_ISNULL(lob_mngr)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("[STORAGE_LOB]failed to get lob manager handle.", K(ret));
} else if (!column.col_type_.is_lob_storage() || obj.is_nop_value() || obj.is_null()) {
// do nothing
} else {
// init lob access param
ObLobAccessParam lob_param;
lob_param.tx_desc_ = run_ctx.store_ctx_.mvcc_acc_ctx_.tx_desc_;
lob_param.parent_seq_no_ = run_ctx.store_ctx_.mvcc_acc_ctx_.tx_scn_;
lob_param.snapshot_ = run_ctx.dml_param_.snapshot_;
lob_param.is_total_quantity_log_ = run_ctx.dml_param_.is_total_quantity_log_;
if (lob_param.snapshot_.is_none_read()) {
// NOTE:
// lob_insert need table_scan, the snapshot already generated in
// run_ctx.store_ctx, use it as an LS ReadSnapshot
lob_param.snapshot_.init_ls_read(run_ctx.store_ctx_.ls_id_,
run_ctx.store_ctx_.mvcc_acc_ctx_.snapshot_);
}
lob_param.tx_id_ = lob_param.tx_desc_->get_tx_id();
lob_param.sql_mode_ = run_ctx.dml_param_.sql_mode_;
lob_param.ls_id_ = run_ctx.store_ctx_.ls_id_;
lob_param.tablet_id_ = run_ctx.relative_table_.get_tablet_id();
lob_param.coll_type_ = column.col_type_.get_collation_type();
lob_param.allocator_ = &run_ctx.lob_allocator_;
lob_param.lob_common_ = lob_common;
if (OB_NOT_NULL(del_param)) {
lob_param.handle_size_ = del_param->handle_size_;
lob_param.checksum_ = del_param->checksum_;
lob_param.total_seq_cnt_ = del_param->total_seq_cnt_;
lob_param.used_seq_cnt_ = del_param->used_seq_cnt_;
lob_param.seq_no_st_ = del_param->seq_no_st_;
}
lob_param.timeout_ = run_ctx.dml_param_.timeout_;
lob_param.scan_backward_ = false;
lob_param.offset_ = 0;
// Notice: currently only inrow data
ObString raw_data = obj.get_string();
ObString data;
// for not strict sql mode, will insert empty string without lob header
bool has_lob_header = obj.has_lob_header() && raw_data.length() > 0;
ObLobLocatorV2 loc(raw_data, has_lob_header);
if (OB_FAIL(lob_mngr->append(lob_param, loc))) {
LOG_WARN("[STORAGE_LOB]lob append failed.", K(ret));
} else {
ObLobCommon *res_lob_common = lob_param.lob_common_;
obj.set_lob_value(obj.get_type(), res_lob_common, lob_param.handle_size_);
LOG_DEBUG("[STORAGE_LOB]write ob lob data.", K(lob_param), KPC(res_lob_common),
K(lob_param.handle_size_), K(column.col_type_.get_collation_type()));
}
}
return ret;
}
int ObLSTabletService::check_lob_tablet_valid(ObTabletHandle &data_tablet)
{
int ret = OB_SUCCESS;
bool is_valid_aux_lob_table = false;
ObTabletBindingMdsUserData ddl_data;
if (OB_FAIL(data_tablet.get_obj()->ObITabletMdsInterface::get_ddl_data(share::SCN::max_scn(), ddl_data))) {
LOG_WARN("failed to get ddl data from tablet", K(ret), K(data_tablet));
} else {
is_valid_aux_lob_table = ddl_data.lob_meta_tablet_id_.is_valid() && ddl_data.lob_piece_tablet_id_.is_valid();
if (!is_valid_aux_lob_table) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("aux lob table must valid when lob column exist", K(ret), K(ddl_data));
}
}
return ret;
}
int ObLSTabletService::insert_lob_tablet_row(
ObTabletHandle &data_tablet,
ObDMLRunningCtx &run_ctx,
ObStoreRow &row)
{
int ret = OB_SUCCESS;
int64_t col_cnt = run_ctx.col_descs_->count();
ObLobManager *lob_mngr = MTL(ObLobManager*);
bool check_lob = false;
if (OB_ISNULL(lob_mngr)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("[STORAGE_LOB]failed to get lob manager handle.", K(ret));
} else if (row.row_val_.count_ != col_cnt) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("[STORAGE_LOB]column count invalid", K(ret), K(col_cnt), K(row.row_val_.count_));
} else {
for (int64_t i = 0; OB_SUCC(ret) && i < col_cnt; ++i) {
const ObColDesc &column = run_ctx.col_descs_->at(i);
ObObj &obj = row.row_val_.get_cell(i);
if (obj.is_null() || obj.is_nop_value()) {
// do nothing
} else if (column.col_type_.is_lob_storage()) {
if (!check_lob) {
if (OB_FAIL(check_lob_tablet_valid(data_tablet))) {
LOG_WARN("failed to check_lob_tablet_valid", K(ret), K(data_tablet));
} else {
check_lob = true;
}
}
if (OB_FAIL(ret)) {
} else if(OB_FAIL(insert_lob_col(run_ctx, column, obj, nullptr, nullptr))) {
LOG_WARN("[STORAGE_LOB]failed to insert lob col.", K(ret), K(row), K(i));
}
}
}
}
return ret;
}
int ObLSTabletService::insert_lob_tablet_rows(
ObTabletHandle &data_tablet,
ObDMLRunningCtx &run_ctx,
ObStoreRow *rows,
int64_t row_count)
{
int ret = OB_SUCCESS;
// DEBUG_SYNC(DELAY_INDEX_WRITE);
ObLobManager *lob_mngr = MTL(ObLobManager*);
if (OB_ISNULL(lob_mngr)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("[STORAGE_LOB]failed to get lob manager handle.", K(ret));
} else {
int64_t col_cnt = run_ctx.col_descs_->count();
for (int64_t k = 0; OB_SUCC(ret) && k < row_count; k++) {
if (OB_FAIL(insert_lob_tablet_row(data_tablet, run_ctx, rows[k]))) {
LOG_WARN("[STORAGE_LOB]failed to insert lob row.", K(ret));
}
}
}
return ret;
}
int ObLSTabletService::extract_rowkey(
const ObRelativeTable &table,
const blocksstable::ObDatumRowkey &rowkey,
char *buffer,
const int64_t buffer_len,
const ObTimeZoneInfo *tz_info)
{
int ret = OB_SUCCESS;
common::ObSEArray<share::schema::ObColDesc, common::OB_MAX_ROWKEY_COLUMN_NUMBER> rowkey_cols;
ObStoreRowkey store_rowkey;
ObDatumRowkeyHelper rowkey_helper;
if (OB_FAIL(table.get_rowkey_column_ids(rowkey_cols))) {
STORAGE_LOG(WARN, "Failed to get rowkey cols", K(ret), K(table));
} else if (OB_FAIL(rowkey_helper.convert_store_rowkey(rowkey, rowkey_cols, store_rowkey))) {
STORAGE_LOG(WARN, "Failed to convert store rowkey", K(ret), K(rowkey));
} else {
ret = extract_rowkey(table, store_rowkey, buffer, buffer_len, tz_info);
}
return ret;
}
int ObLSTabletService::extract_rowkey(
const ObRelativeTable &table,
const common::ObStoreRowkey &rowkey,
char *buffer,
const int64_t buffer_len,
const ObTimeZoneInfo *tz_info)
{
int ret = OB_SUCCESS;
if (!table.is_valid() || !rowkey.is_valid() || OB_ISNULL(buffer) || buffer_len <= 0) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid argument", K(ret), K(table), K(rowkey), K(buffer), K(buffer_len), K(tz_info));
} else {
const int64_t rowkey_size = table.get_rowkey_column_num();
int64_t pos = 0;
int64_t valid_rowkey_size = 0;
uint64_t column_id = OB_INVALID_ID;
for (int64_t i = 0; OB_SUCC(ret) && i < rowkey_size; i++) {
if (OB_FAIL(table.get_rowkey_col_id_by_idx(i, column_id))) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("Failed to get rowkey column description", K(i), K(ret));
} else if (column_id <= OB_MIN_SHADOW_COLUMN_ID) {
valid_rowkey_size ++;
}
}
for (int64_t i = 0; OB_SUCC(ret) && i < valid_rowkey_size; ++i) {
const ObObj &obj = rowkey.get_obj_ptr()[i];
if (OB_FAIL(obj.print_plain_str_literal(buffer, buffer_len - 1, pos, tz_info))) {
LOG_WARN("fail to print_plain_str_literal", K(ret));
} else if (i < valid_rowkey_size - 1) {
if (OB_FAIL(databuff_printf(buffer, buffer_len - 1, pos, "-"))) {
LOG_WARN("databuff print failed", K(ret));
}
}
}
if (buffer != nullptr) {
buffer[pos++] = '\0';
}
}
return ret;
}
int ObLSTabletService::get_next_rows(
ObNewRowIterator *row_iter,
ObNewRow *&rows,
int64_t &row_count)
{
return row_iter->get_next_rows(rows, row_count);
}
int ObLSTabletService::construct_update_idx(
const int64_t schema_rowkey_cnt,
const share::schema::ColumnMap *col_map,
const common::ObIArray<uint64_t> &upd_col_ids,
UpdateIndexArray &update_idx)
{
int ret = OB_SUCCESS;
int err = OB_SUCCESS;
if (OB_ISNULL(col_map) || upd_col_ids.count() <= 0 || update_idx.count() > 0 || schema_rowkey_cnt <= 0) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(col_map), K(upd_col_ids), K(upd_col_ids.count()), K(schema_rowkey_cnt));
} else {
for (int64_t i = 0; OB_SUCC(ret) && i < upd_col_ids.count(); ++i) {
int32_t idx = -1;
const uint64_t &col_id = upd_col_ids.at(i);
if (OB_SUCCESS != (err = col_map->get(col_id, idx)) || idx < 0) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("column id doesn't exist", K(ret), K(col_id), K(err));
} else if (idx < schema_rowkey_cnt) {
// update_idx should not contain rowkey
} else if (OB_FAIL(update_idx.push_back(idx))) {
LOG_WARN("fail to push idx into update_idx", K(ret), K(idx));
}
}
if (OB_SUCC(ret) && update_idx.count() > 1) {
std::sort(update_idx.begin(), update_idx.end());
}
}
return ret;
}
int ObLSTabletService::check_rowkey_change(
const ObIArray<uint64_t> &update_ids,
const ObRelativeTable &relative_table,
bool &rowkey_change,
bool &delay_new)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(update_ids.count() <= 0 || !relative_table.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(update_ids), K(ret));
} else {
const int64_t count = update_ids.count();
bool is_rowkey = false;
rowkey_change = false;
delay_new = false;
for (int64_t i = 0; OB_SUCC(ret) && i < count && !rowkey_change; ++i) {
if (OB_FAIL(relative_table.is_rowkey_column_id(update_ids.at(i), is_rowkey))) {
LOG_WARN("check is_rowkey fail", K(ret), K(update_ids.at(i)));
} else {
rowkey_change = is_rowkey;
}
}
if (OB_FAIL(ret)) {
// do nothing
} else if (relative_table.is_unique_index() && !rowkey_change) {
uint64_t cid = OB_INVALID_ID;
bool innullable = true;
for (int64_t j = 0; OB_SUCC(ret) && j < relative_table.get_rowkey_column_num() && !rowkey_change; ++j) {
if (OB_FAIL(relative_table.get_rowkey_col_id_by_idx(j, cid))) {
LOG_WARN("get rowkey column id fail", K(ret), K(j));
} else if (cid > OB_MIN_SHADOW_COLUMN_ID) {
if (innullable) {
break; // other_change
} else {
cid -= OB_MIN_SHADOW_COLUMN_ID;
for (int64_t k = 0; OB_SUCC(ret) && k < count; ++k) {
if (cid == update_ids.at(k)) {
rowkey_change = true;
break;
}
}
}
} else {
bool is_nullable = false;
if (OB_FAIL(relative_table.is_column_nullable_for_write(cid, is_nullable))) {
LOG_WARN("check nullable fail", K(ret), K(cid), K(relative_table));
} else if (is_nullable) {
innullable = false;
}
}
}
}
if (OB_SUCC(ret) && rowkey_change) {
delay_new = true;
}
LOG_DEBUG("check rowkey change for update", K(rowkey_change), K(delay_new), K(update_ids), K(relative_table));
}
return ret;
}
int ObLSTabletService::check_rowkey_value_change(
const common::ObNewRow &old_row,
const common::ObNewRow &new_row,
const int64_t rowkey_len,
bool &rowkey_change)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(rowkey_len <= 0)
|| OB_UNLIKELY(old_row.count_ < rowkey_len)
|| OB_UNLIKELY(new_row.count_ < rowkey_len)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(old_row), K(new_row),
K(rowkey_len), K(ret));
} else {
rowkey_change = false;
for (int64_t i = 0; !rowkey_change && i < rowkey_len; ++i) {
if (old_row.cells_[i] != new_row.cells_[i]) {
rowkey_change = true;
}
}
}
LOG_DEBUG("check rowkey value for update", K(rowkey_change), K(old_row), K(new_row));
return ret;
}
int ObLSTabletService::process_delta_lob(
ObDMLRunningCtx &run_ctx,
const ObColDesc &column,
ObObj &old_obj,
ObLobLocatorV2 &delta_lob,
ObObj &obj)
{
int ret = OB_SUCCESS;
ObLobManager *lob_mngr = MTL(ObLobManager*);
if (OB_ISNULL(lob_mngr)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("[STORAGE_LOB]failed to get lob manager handle.", K(ret));
} else if (!delta_lob.is_delta_temp_lob()) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("[STORAGE_LOB] invalid lob type", K(ret), K(delta_lob));
} else {
ObLobAccessParam lob_param;
// init lob param
lob_param.tx_desc_ = run_ctx.store_ctx_.mvcc_acc_ctx_.tx_desc_;
lob_param.parent_seq_no_ = run_ctx.store_ctx_.mvcc_acc_ctx_.tx_scn_;
lob_param.snapshot_ = run_ctx.dml_param_.snapshot_;
if (lob_param.snapshot_.is_none_read()) {
// NOTE:
// lob_insert need table_scan, the snapshot already generated in
// run_ctx.store_ctx, use it as an LS ReadSnapshot
lob_param.snapshot_.init_ls_read(run_ctx.store_ctx_.ls_id_,
run_ctx.store_ctx_.mvcc_acc_ctx_.snapshot_);
}
lob_param.tx_id_ = lob_param.tx_desc_->get_tx_id();
lob_param.sql_mode_ = run_ctx.dml_param_.sql_mode_;
lob_param.ls_id_ = run_ctx.store_ctx_.ls_id_;
lob_param.tablet_id_ = run_ctx.relative_table_.get_tablet_id();
lob_param.coll_type_ = column.col_type_.get_collation_type();
lob_param.allocator_ = &run_ctx.lob_allocator_;
// should use old obj lob
ObLobLocatorV2 old_lob;
ObString old_disk_lob;
if (OB_FAIL(old_obj.get_lob_locatorv2(old_lob))) {
LOG_WARN("get old lob locator failed.", K(ret), K(old_obj));
} else if (!old_lob.is_valid()) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("old lob locator is invalid.", K(ret));
} else if (OB_FAIL(old_lob.get_disk_locator(old_disk_lob))) {
LOG_WARN("fail to get old lob disk locator.", K(ret));
} else {
lob_param.lob_locator_ = nullptr;
lob_param.lob_common_ = reinterpret_cast<ObLobCommon*>(old_disk_lob.ptr());
lob_param.handle_size_ = old_disk_lob.length();
lob_param.byte_size_ = lob_param.lob_common_->get_byte_size(lob_param.handle_size_);
lob_param.timeout_ = run_ctx.dml_param_.timeout_;
lob_param.scan_backward_ = false;
if (OB_FAIL(lob_mngr->process_delta(lob_param, delta_lob))) {
LOG_WARN("failed to process delta lob.", K(ret), K(lob_param), K(delta_lob));
} else {
// update obj with new disk locator
obj.set_lob_value(obj.get_type(), lob_param.lob_common_, lob_param.handle_size_);
}
}
}
return ret;
}
int ObLSTabletService::process_lob_row(
ObTabletHandle &tablet_handle,
ObDMLRunningCtx &run_ctx,
const ObIArray<int64_t> &update_idx,
bool data_tbl_rowkey_change,
ObStoreRow &old_sql_row,
ObStoreRow &old_row,
ObStoreRow &new_row)
{
int ret = OB_SUCCESS;
bool check_lob = false;
if (OB_UNLIKELY(old_row.row_val_.get_count() != new_row.row_val_.get_count())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("[STORAGE_LOB]invalid args", K(old_row), K(new_row), K(ret));
} else if (OB_UNLIKELY(old_row.row_val_.get_count() != run_ctx.col_descs_->count())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("[STORAGE_LOB]invalid args", K(old_row), K(new_row), KPC(run_ctx.col_descs_));
} else {
for (int64_t i = 0; OB_SUCC(ret) && i < old_row.row_val_.get_count(); ++i) {
if (run_ctx.col_descs_->at(i).col_type_.is_lob_storage()) {
ObObj &old_obj = old_row.row_val_.get_cell(i);
ObObj &old_sql_obj = old_sql_row.row_val_.get_cell(i);
ObObj &new_obj = new_row.row_val_.get_cell(i);
bool is_update = false;
for (int64_t j = 0; !is_update && j < update_idx.count(); ++j) {
if (update_idx.at(j) == i) {
is_update = true;
}
}
if (is_update) {
if (!check_lob) {
if (OB_FAIL(check_lob_tablet_valid(tablet_handle))) {
LOG_WARN("failed to check_lob_tablet_valid", K(ret), K(tablet_handle));
} else {
check_lob = true;
}
}
// get new lob locator
ObString new_lob_str = (new_obj.is_null() || new_obj.is_nop_value())
? ObString(0, nullptr) : new_obj.get_string();
ObLobLocatorV2 new_lob(new_lob_str, new_obj.has_lob_header());
if (OB_FAIL(ret)) {
} else if (new_obj.is_null() ||
new_obj.is_nop_value() ||
new_lob.is_full_temp_lob() ||
new_lob.is_persist_lob() ||
(new_lob.is_lob_disk_locator() && new_lob.has_inrow_data())) {
ObLobCommon *lob_common = nullptr;
ObLobAccessParam lob_param;
if (OB_FAIL(new_lob.get_lob_data_byte_len(lob_param.update_len_))) {
LOG_WARN("fail to get new lob byte len", K(ret), K(new_lob), K(i));
} else if (OB_FAIL(delete_lob_col(run_ctx, run_ctx.col_descs_->at(i), old_obj, old_sql_obj, lob_common, lob_param))) {
LOG_WARN("[STORAGE_LOB]failed to erase old lob col", K(ret), K(old_sql_row), K(old_row), K(i));
} else if (OB_FAIL(insert_lob_col(run_ctx, run_ctx.col_descs_->at(i), new_obj, &lob_param, lob_common))) {
LOG_WARN("[STORAGE_LOB]failed to insert new lob col.", K(ret), K(new_row), K(i));
}
} else if (new_lob.is_delta_temp_lob()) {
if (OB_FAIL(process_delta_lob(run_ctx, run_ctx.col_descs_->at(i), old_sql_obj, new_lob, new_obj))) {
LOG_WARN("failed to process delta lob.", K(ret), K(i));
}
} else {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("unexpected obj for new lob", K(ret), K(i), K(new_obj), K(new_lob));
}
} else {
if (old_obj.is_null()) {
new_obj.set_null();
} else if (old_obj.is_nop_value()) {
new_obj.set_nop_value();
} else if (new_obj.is_nop_value() || new_obj.is_null()) {
// do nothing
} else {
if (old_obj.is_null()) {
new_obj.set_null();
} else if (old_obj.is_nop_value()) {
new_obj.set_nop_value();
} else {
ObString val_str = old_obj.get_string();
ObLobCommon *lob_common = reinterpret_cast<ObLobCommon*>(val_str.ptr());
if (!lob_common->in_row_ && data_tbl_rowkey_change) {
ObLobAccessParam lob_param;
if (val_str.length() < ObLobManager::LOB_WITH_OUTROW_CTX_SIZE) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("not enough space for lob header", K(ret), K(val_str), K(i));
} else if (OB_FAIL(delete_lob_col(run_ctx, run_ctx.col_descs_->at(i), old_obj, old_sql_obj, lob_common, lob_param))) {
LOG_WARN("[STORAGE_LOB]failed to erase old lob col", K(ret), K(old_sql_row), K(old_row), K(i));
} else if (OB_FAIL(insert_lob_col(run_ctx, run_ctx.col_descs_->at(i), new_obj, nullptr, nullptr))) { // no need del_param
LOG_WARN("[STORAGE_LOB]failed to insert new lob col.", K(ret), K(new_row), K(i));
}
} else {
new_obj.set_lob_value(new_obj.get_type(), val_str.ptr(), val_str.length()); // remove has lob header flag
}
}
}
}
}
}
}
return ret;
}
int ObLSTabletService::update_row_to_tablet(
ObTabletHandle &tablet_handle,
ObDMLRunningCtx &run_ctx,
const bool rowkey_change,
const ObIArray<int64_t> &update_idx,
const bool delay_new,
const bool lob_update,
ObStoreRow &old_tbl_row,
ObStoreRow &new_tbl_row,
ObRowStore *row_store,
bool &duplicate)
{
int ret = OB_SUCCESS;
const ObDMLBaseParam &dml_param = run_ctx.dml_param_;
const ObColDescIArray &col_descs = *run_ctx.col_descs_;
bool data_tbl_rowkey_change = false;
int64_t data_tbl_rowkey_len = run_ctx.relative_table_.get_rowkey_column_num();
ObSQLMode sql_mode = dml_param.sql_mode_;
duplicate = false;
ObStoreRow old_sql_tbl_row;
old_sql_tbl_row.row_val_ = old_tbl_row.row_val_;
if (OB_UNLIKELY(col_descs.count() != old_tbl_row.row_val_.get_count()
|| col_descs.count() != new_tbl_row.row_val_.get_count())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(col_descs.count()),
K(old_tbl_row.row_val_), K(new_tbl_row.row_val_));
} else if (rowkey_change && OB_FAIL(check_rowkey_value_change(old_tbl_row.row_val_,
new_tbl_row.row_val_,
data_tbl_rowkey_len,
data_tbl_rowkey_change))) {
LOG_WARN("failed to check data table rowkey change", K(ret),
K(old_tbl_row), K(new_tbl_row), K(data_tbl_rowkey_len));
} else if (OB_FAIL(process_old_row(tablet_handle,
run_ctx,
data_tbl_rowkey_change,
lob_update,
old_tbl_row))) {
if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) {
LOG_WARN("fail to process old row", K(ret), K(*run_ctx.col_descs_),
K(old_tbl_row), K(data_tbl_rowkey_change));
}
} else if (OB_FAIL(process_lob_row(tablet_handle,
run_ctx,
update_idx,
data_tbl_rowkey_change,
old_sql_tbl_row,
old_tbl_row,
new_tbl_row))) {
LOG_WARN("failed to process lob col change", K(ret), K(old_tbl_row), K(new_tbl_row));
} else if (delay_new && lib::is_oracle_mode()) {
// if total quantity log is needed, we should cache both new row and old row,
// and the sequence is new_row1, old_row1, new_row2, old_row2....,
// if total quantity log isn't needed, just cache new row
if (OB_ISNULL(row_store)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("row_store is NULL", K(ret));
} else if (OB_FAIL(row_store->add_row(new_tbl_row.row_val_))) {
LOG_WARN("failed to store new row", K(new_tbl_row), K(ret));
} else if (OB_FAIL(row_store->add_row(old_tbl_row.row_val_))) {
LOG_WARN("failed to store old row", K(old_tbl_row), K(ret));
} else {
LOG_DEBUG("add row store for delay new", K(old_tbl_row), K(new_tbl_row));
}
} else if (OB_FAIL(process_new_row(tablet_handle,
run_ctx,
update_idx,
old_tbl_row,
new_tbl_row,
data_tbl_rowkey_change))) {
if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) {
LOG_WARN("fail to process new row", K(new_tbl_row), K(ret));
}
}
return ret;
}
int ObLSTabletService::process_old_row(
ObTabletHandle &tablet_handle,
ObDMLRunningCtx &run_ctx,
const bool data_tbl_rowkey_change,
const bool lob_update,
ObStoreRow &tbl_row)
{
int ret = OB_SUCCESS;
ObStoreCtx &store_ctx = run_ctx.store_ctx_;
ObRelativeTable &relative_table = run_ctx.relative_table_;
bool is_delete_total_quantity_log = run_ctx.dml_param_.is_total_quantity_log_;
if (OB_UNLIKELY(!relative_table.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid relative tables", K(ret), K(relative_table));
} else if (OB_UNLIKELY(!store_ctx.is_valid()
|| nullptr == run_ctx.col_descs_
|| run_ctx.col_descs_->count() <= 0
|| !tbl_row.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(store_ctx), KP(run_ctx.col_descs_), K(tbl_row), K(is_delete_total_quantity_log));
} else if (OB_FAIL(check_old_row_legitimacy(tablet_handle, run_ctx, tbl_row.row_val_))) {
if (OB_ERR_DEFENSIVE_CHECK == ret) {
dump_diag_info_for_old_row_loss(relative_table, store_ctx, tbl_row);
}
LOG_WARN("check old row legitimacy failed", K(tbl_row.row_val_));
} else if (OB_FAIL(process_old_row_lob_col(tablet_handle, run_ctx, tbl_row))){
LOG_WARN("failed to process old row lob col", K(ret), K(tbl_row));
} else {
ObColDescIArray &col_descs = const_cast<ObColDescIArray&>(*run_ctx.col_descs_);
const uint64_t &table_id = relative_table.get_table_id();
int64_t rowkey_size = relative_table.get_rowkey_column_num();
ObStoreRowkey store_rowkey;
ObDatumRowkey datum_rowkey;
ObDatumRowkeyHelper rowkey_helper(run_ctx.allocator_);
if (OB_UNLIKELY(run_ctx.dml_param_.prelock_)) {
bool locked = false;
if (OB_FAIL(store_rowkey.assign(tbl_row.row_val_.cells_, rowkey_size))) {
LOG_WARN("Failed to assign rowkey", K(ret), K(tbl_row), K(rowkey_size));
} else if (OB_FAIL(rowkey_helper.convert_datum_rowkey(store_rowkey.get_rowkey(), datum_rowkey))) {
STORAGE_LOG(WARN, "Failed to transfer datum rowkey", K(ret), K(store_rowkey), K(rowkey_size), K(tbl_row));
} else if (OB_FAIL(check_row_locked_by_myself(tablet_handle, relative_table, store_ctx, datum_rowkey, locked))) {
LOG_WARN("fail to check row locked", K(ret), K(tbl_row));
} else if (!locked) {
ret = OB_ERR_ROW_NOT_LOCKED;
LOG_DEBUG("row has not been locked", K(ret), K(tbl_row));
}
}
if (OB_FAIL(ret)) {
} else if (data_tbl_rowkey_change) {
ObStoreRow del_row(tbl_row);
del_row.flag_.set_flag(ObDmlFlag::DF_DELETE);
if (!is_delete_total_quantity_log) {
if (OB_FAIL(tablet_handle.get_obj()->insert_row_without_rowkey_check(relative_table,
run_ctx.store_ctx_, col_descs, del_row, run_ctx.dml_param_.encrypt_meta_))) {
if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) {
LOG_WARN("failed to write data tablet row", K(ret), K(del_row));
}
}
} else {
ObStoreRow new_tbl_row;
new_tbl_row.flag_.set_flag(ObDmlFlag::DF_DELETE);
new_tbl_row.row_val_ = tbl_row.row_val_;
del_row.flag_.set_flag(ObDmlFlag::DF_UPDATE);
ObSEArray<int64_t, 8> update_idx;
if (OB_FAIL(tablet_handle.get_obj()->update_row(relative_table,
run_ctx.store_ctx_, col_descs, update_idx, del_row, new_tbl_row, run_ctx.dml_param_.encrypt_meta_))) {
if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) {
LOG_WARN("failed to write data tablet row", K(ret), K(del_row), K(new_tbl_row));
}
}
}
} else if (lob_update) {
// need to lock main table rows that don't need to be deleted
if (OB_FAIL(store_rowkey.assign(tbl_row.row_val_.cells_, rowkey_size))) {
LOG_WARN("Failed to assign rowkey", K(ret), K(tbl_row), K(rowkey_size));
} else if (OB_FAIL(rowkey_helper.convert_datum_rowkey(store_rowkey.get_rowkey(), datum_rowkey))) {
STORAGE_LOG(WARN, "Failed to transfer datum rowkey", K(ret), K(store_rowkey));
} else if (OB_FAIL(tablet_handle.get_obj()->lock_row(relative_table, store_ctx, datum_rowkey))) {
if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) {
LOG_WARN("lock row failed", K(ret), K(table_id), K(tbl_row), K(rowkey_size));
}
}
LOG_DEBUG("generate lock node before update lob columns", K(ret), K(table_id), K(tbl_row));
}
}
return ret;
}
int ObLSTabletService::process_new_row(
ObTabletHandle &tablet_handle,
ObDMLRunningCtx &run_ctx,
const common::ObIArray<int64_t> &update_idx,
const ObStoreRow &old_tbl_row,
const ObStoreRow &new_tbl_row,
const bool rowkey_change)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(update_idx.count() < 0 || !new_tbl_row.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(update_idx), K(new_tbl_row), K(rowkey_change));
} else if (GCONF.enable_defensive_check()
&& OB_FAIL(check_new_row_legitimacy(run_ctx, new_tbl_row.row_val_))) {
LOG_WARN("check new row legitimacy failed", K(ret), K(new_tbl_row.row_val_));
} else {
// write full column clog needs to construct update_idx and pass to memtable
if (OB_FAIL(process_data_table_row(tablet_handle,
run_ctx,
update_idx,
old_tbl_row,
new_tbl_row,
rowkey_change))) {
if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) {
LOG_WARN("fail to process data table row", K(ret),
K(update_idx), K(old_tbl_row), K(new_tbl_row), K(rowkey_change));
}
}
}
return ret;
}
int ObLSTabletService::process_data_table_row(
ObTabletHandle &data_tablet,
ObDMLRunningCtx &run_ctx,
const ObIArray<int64_t> &update_idx,
const ObStoreRow &old_tbl_row,
const ObStoreRow &new_tbl_row,
const bool rowkey_change)
{
int ret = OB_SUCCESS;
ObStoreCtx &ctx = run_ctx.store_ctx_;
ObRelativeTable &relative_table = run_ctx.relative_table_;
bool is_update_total_quantity_log = run_ctx.dml_param_.is_total_quantity_log_;
const common::ObTimeZoneInfo *tz_info = run_ctx.dml_param_.tz_info_;
if (OB_UNLIKELY(!ctx.is_valid()
|| !relative_table.is_valid()
|| nullptr == run_ctx.col_descs_
|| run_ctx.col_descs_->count() <= 0
|| update_idx.count() < 0
|| (is_update_total_quantity_log && !old_tbl_row.is_valid())
|| !new_tbl_row.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(ctx),
KP(run_ctx.col_descs_), K(update_idx), K(old_tbl_row), K(new_tbl_row),
K(is_update_total_quantity_log), K(rowkey_change));
} else {
const ObColDescIArray &col_descs = *run_ctx.col_descs_;
bool exists = false;
if (rowkey_change && OB_FAIL(data_tablet.get_obj()->rowkey_exists(
relative_table,
ctx,
new_tbl_row.row_val_,
exists))) {
LOG_WARN("failed to check rowkey exists", K(ret), K(new_tbl_row));
} else if (exists) {
char buffer[OB_TMP_BUF_SIZE_256];
ObStoreRowkey rowkey;
ret = OB_ERR_PRIMARY_KEY_DUPLICATE;
if (OB_SUCCESS != rowkey.assign(new_tbl_row.row_val_.cells_, relative_table.get_rowkey_column_num())) {
LOG_WARN("Failed to assign rowkey", K(new_tbl_row));
} else if (OB_SUCCESS != extract_rowkey(relative_table, rowkey, buffer, OB_TMP_BUF_SIZE_256, tz_info)) {
LOG_WARN("extract rowkey failed", K(rowkey));
} else {
ObString index_name = "PRIMARY";
if (relative_table.is_index_table()) {
relative_table.get_index_name(index_name);
}
LOG_USER_ERROR(OB_ERR_PRIMARY_KEY_DUPLICATE, buffer, index_name.length(), index_name.ptr());
}
LOG_WARN("rowkey already exists", K(ret), K(new_tbl_row));
} else {
ObStoreRow new_row;
new_row.flag_.set_flag(rowkey_change ? ObDmlFlag::DF_INSERT : ObDmlFlag::DF_UPDATE);
new_row.row_val_ = new_tbl_row.row_val_;
if (is_update_total_quantity_log && !rowkey_change) {
ObStoreRow old_row;
old_row.flag_.set_flag(ObDmlFlag::DF_UPDATE);
old_row.row_val_ = old_tbl_row.row_val_;
if (OB_FAIL(data_tablet.get_obj()->update_row(relative_table,
ctx, col_descs, update_idx, old_row, new_row, run_ctx.dml_param_.encrypt_meta_))) {
if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) {
LOG_WARN("failed to update to row", K(ret), K(old_row), K(new_row));
}
}
} else {
if (OB_FAIL(data_tablet.get_obj()->insert_row_without_rowkey_check(relative_table,
ctx, col_descs, new_row, run_ctx.dml_param_.encrypt_meta_))) {
if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) {
LOG_WARN("failed to update to row", K(ret), K(new_row));
}
}
}
}
}
return ret;
}
int ObLSTabletService::check_new_row_nullable_value(
const ObIArray<uint64_t> &column_ids,
ObRelativeTable &data_table,
const ObNewRow &new_row)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(column_ids.count() != new_row.get_count())) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("new row is invalid", K(ret), K(new_row.get_count()), K(column_ids.count()));
}
for (int64_t i = 0; OB_SUCC(ret) && i < column_ids.count(); ++i) {
uint64_t column_id = column_ids.at(i);
bool is_nullable = false;
if (OB_UNLIKELY(is_shadow_column(column_id))) {
//the shadow pk is generated internally,
//and the nullable attribute check for it is skipped
} else if (OB_FAIL(data_table.is_column_nullable_for_write(column_id, is_nullable))) {
LOG_WARN("check is_column_nullable_for_write failed", K(ret), K(column_id));
} else if (new_row.get_cell(i).is_null() && !is_nullable) {
bool is_hidden = false;
bool is_gen_col = false;
bool is_nullable_for_read = false;
if (OB_FAIL(data_table.is_column_nullable_for_read(column_id, is_nullable_for_read))) {
LOG_WARN("check is nullable for read failed", K(ret));
} else if (is_nullable_for_read) {
LOG_TRACE("Catch a defensive nullable error, but this column is not null novalidate",
K(column_id), K(column_ids), K(new_row), K(data_table));
} else if (OB_FAIL(data_table.is_hidden_column(column_id, is_hidden))) {
LOG_WARN("get is hidden column failed", K(ret), K(column_id));
} else if (OB_FAIL(data_table.is_gen_column(column_id, is_gen_col))) {
LOG_WARN("get is gen column failed", K(ret), K(column_id));
} else if (is_hidden && !is_gen_col) {
ret = OB_BAD_NULL_ERROR;
LOG_WARN("Catch a defensive nullable error, "
"maybe cause by add column not null default null ONLINE", K(ret),
K(column_id), K(column_ids), K(new_row), K(data_table));
} else {
ret = OB_ERR_DEFENSIVE_CHECK;
ObString func_name = ObString::make_string("check_new_row_nullable_value");
LOG_USER_ERROR(OB_ERR_DEFENSIVE_CHECK, func_name.length(), func_name.ptr());
LOG_DBA_ERROR(OB_ERR_DEFENSIVE_CHECK, "msg", "Fatal Error!!! Catch a defensive error!", K(ret),
K(column_id), K(column_ids), K(new_row), K(data_table));
}
} else if (new_row.get_cell(i).is_number()) {
number::ObNumber num;
if (OB_FAIL(new_row.get_cell(i).get_number(num))) {
LOG_WARN("get number value from object fail", K(ret), K(new_row.get_cell(i)));
} else if (OB_FAIL(num.sanity_check())) {
LOG_WARN("sanity check number failed", K(ret), K(new_row.get_cell(i)));
}
if (OB_SUCCESS != ret) {
ret = OB_ERR_DEFENSIVE_CHECK;
ObString func_name = ObString::make_string("check_new_row_nullable_value");
LOG_USER_ERROR(OB_ERR_DEFENSIVE_CHECK, func_name.length(), func_name.ptr());
LOG_DBA_ERROR(OB_ERR_DEFENSIVE_CHECK, "msg", "Fatal Error!!! Catch a defensive error!", K(ret),
K(column_id), K(column_ids), K(new_row), K(data_table));
}
}
}
return ret;
}
int ObLSTabletService::check_new_row_nullable_value(const ObIArray<ObColDesc> &col_descs,
ObRelativeTable &relative_table,
const ObNewRow &new_row)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(col_descs.count() > new_row.get_count())) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("new row is invalid", K(ret), K(new_row.get_count()), K(col_descs.count()));
}
for (int64_t i = 0; OB_SUCC(ret) && i < col_descs.count(); ++i) {
uint64_t column_id = col_descs.at(i).col_id_;
bool is_nullable = false;
if (OB_UNLIKELY(is_shadow_column(column_id))) {
//the shadow pk is generated internally,
//and the nullable attribute check for it is skipped
} else if (OB_FAIL(relative_table.is_column_nullable_for_write(column_id, is_nullable))) {
LOG_WARN("check is_column_nullable_for_write failed", K(ret), K(column_id));
} else if (new_row.get_cell(i).is_null() && !is_nullable) {
bool is_hidden = false;
bool is_gen_col = false;
bool is_nullable_for_read = false;
if (OB_FAIL(relative_table.is_column_nullable_for_read(column_id, is_nullable_for_read))) {
LOG_WARN("check is nullable for read failed", K(ret));
} else if (is_nullable_for_read) {
//this column is not null novalidate, maybe the null column come from the old data
//so output trace log and ignore it
LOG_TRACE("Catch a defensive nullable error, but this column is not null novalidate",
K(column_id), K(col_descs), K(new_row), K(relative_table));
} else if (OB_FAIL(relative_table.is_hidden_column(column_id, is_hidden))) {
LOG_WARN("get is hidden column failed", K(ret), K(column_id));
} else if (OB_FAIL(relative_table.is_gen_column(column_id, is_gen_col))) {
LOG_WARN("get is gen column failed", K(ret), K(column_id));
} else if (is_hidden && !is_gen_col) {
ret = OB_BAD_NULL_ERROR;
LOG_WARN("Catch a defensive nullable error, "
"maybe cause by add column not null default null ONLINE", K(ret),
K(column_id), K(col_descs), K(new_row), K(relative_table));
} else {
ret = OB_ERR_DEFENSIVE_CHECK;
ObString func_name = ObString::make_string("check_new_row_nullable_value");
LOG_USER_ERROR(OB_ERR_DEFENSIVE_CHECK, func_name.length(), func_name.ptr());
LOG_DBA_ERROR(OB_ERR_DEFENSIVE_CHECK, "msg", "Fatal Error!!! Catch a defensive error!", K(ret),
K(column_id), K(col_descs), K(new_row), K(relative_table));
}
} else if (new_row.get_cell(i).is_number()) {
number::ObNumber num;
if (OB_FAIL(new_row.get_cell(i).get_number(num))) {
LOG_WARN("get number value from object fail", K(ret), K(new_row.get_cell(i)));
} else if (OB_FAIL(num.sanity_check())) {
LOG_WARN("sanity check number failed", K(ret), K(new_row.get_cell(i)));
}
if (OB_SUCCESS != ret) {
ret = OB_ERR_DEFENSIVE_CHECK;
ObString func_name = ObString::make_string("check_new_row_nullable_value");
LOG_USER_ERROR(OB_ERR_DEFENSIVE_CHECK, func_name.length(), func_name.ptr());
LOG_DBA_ERROR(OB_ERR_DEFENSIVE_CHECK, "msg", "Fatal Error!!! Catch a defensive error!", K(ret),
K(column_id), K(col_descs), K(new_row), K(relative_table));
}
}
}
return ret;
}
int ObLSTabletService::check_new_row_shadow_pk(
const ObIArray<uint64_t> &column_ids,
ObRelativeTable &data_table,
const ObNewRow &new_row)
{
int ret = OB_SUCCESS;
if (data_table.get_shadow_rowkey_column_num() > 0) {
//check shadow pk
int64_t rowkey_cnt = data_table.get_rowkey_column_num();
int64_t spk_cnt = data_table.get_shadow_rowkey_column_num();
int64_t index_col_cnt = rowkey_cnt - spk_cnt;
bool need_spk = false;
if (OB_UNLIKELY(index_col_cnt <= 0) || OB_UNLIKELY(column_ids.count() < rowkey_cnt)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("index column count is invalid", K(ret),
K(index_col_cnt), K(rowkey_cnt), K(spk_cnt), K(column_ids.count()));
} else if (lib::is_mysql_mode()) {
// mysql兼容:只要unique index key中有null列,则需要填充shadow列
bool rowkey_has_null = false;
for (int64_t i = 0; !rowkey_has_null && i < index_col_cnt; i++) {
rowkey_has_null = new_row.get_cell(i).is_null();
}
need_spk = rowkey_has_null;
} else {
// oracle兼容:只有unique index key全为null列时,才需要填充shadow列
bool is_rowkey_all_null = true;
for (int64_t i = 0; is_rowkey_all_null && i < index_col_cnt; i++) {
is_rowkey_all_null = new_row.get_cell(i).is_null();
}
need_spk = is_rowkey_all_null;
}
for (int64_t i = index_col_cnt; OB_SUCC(ret) && i < rowkey_cnt; ++i) {
uint64_t spk_column_id = column_ids.at(i);
uint64_t real_pk_id = spk_column_id - OB_MIN_SHADOW_COLUMN_ID;
const ObObj &spk_value = new_row.get_cell(i);
int64_t pk_idx = OB_INVALID_INDEX;
int cmp = 0;
if (OB_LIKELY(!need_spk)) {
if (!spk_value.is_null()) {
ret = OB_ERR_DEFENSIVE_CHECK;
ObString func_name = ObString::make_string("check_new_row_shadow_pk");
LOG_USER_ERROR(OB_ERR_DEFENSIVE_CHECK, func_name.length(), func_name.ptr());
LOG_ERROR("Fatal Error!!! Catch a defensive error!", K(ret),
"column_id", column_ids, K(new_row), K(data_table),
K(spk_value), K(i), K(spk_column_id), K(real_pk_id));
}
} else if (OB_UNLIKELY(!has_exist_in_array(column_ids, real_pk_id, &pk_idx))) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("real pk column not exists in column_ids", K(ret), K(column_ids), K(real_pk_id));
} else if (OB_FAIL(new_row.get_cell(pk_idx).compare(spk_value, cmp)) || 0 != cmp) {
ret = OB_ERR_DEFENSIVE_CHECK;
ObString func_name = ObString::make_string("check_new_row_shadow_pk");
LOG_USER_ERROR(OB_ERR_DEFENSIVE_CHECK, func_name.length(), func_name.ptr());
LOG_DBA_ERROR(OB_ERR_DEFENSIVE_CHECK, "msg", "Fatal Error!!! Catch a defensive error!", K(ret),
"column_id", column_ids, K(new_row), K(data_table),
K(spk_value), "pk_value", new_row.get_cell(pk_idx),
K(pk_idx), K(i), K(spk_column_id), K(real_pk_id));
}
}
}
return ret;
}
int ObLSTabletService::check_row_locked_by_myself(
ObTabletHandle &tablet_handle,
ObRelativeTable &relative_table,
ObStoreCtx &store_ctx,
const ObDatumRowkey &rowkey,
bool &locked)
{
int ret = OB_SUCCESS;
ObTablet *tablet = tablet_handle.get_obj();
if (OB_UNLIKELY(nullptr == tablet
|| !relative_table.is_valid()
|| !store_ctx.is_valid()
|| !rowkey.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(tablet_handle),
K(relative_table), K(store_ctx), K(rowkey));
} else {
ObStorageTableGuard guard(tablet, store_ctx, true);
if (OB_FAIL(guard.refresh_and_protect_table(relative_table))) {
LOG_WARN("fail to protect table", K(ret), K(tablet_handle));
} else if (OB_FAIL(tablet->check_row_locked_by_myself(relative_table, store_ctx, rowkey, locked))) {
LOG_WARN("fail to check row locked, ", K(ret), K(rowkey));
}
}
return ret;
}
int ObLSTabletService::get_conflict_rows(
ObTabletHandle &tablet_handle,
ObDMLRunningCtx &run_ctx,
const ObInsertFlag flag,
const common::ObIArray<uint64_t> &out_col_ids,
const common::ObNewRow &row,
common::ObNewRowIterator *&duplicated_rows)
{
TRANS_LOG(DEBUG, "get conflict rows", K(flag), K(row), K(lbt()));
int ret = OB_SUCCESS;
ObRelativeTable &data_table = run_ctx.relative_table_;
ObArenaAllocator scan_allocator(common::ObMemAttr(MTL_ID(), ObModIds::OB_TABLE_SCAN_ITER));
ObIAllocator *allocator = &scan_allocator;
ObTablet *data_tablet = tablet_handle.get_obj();
ObDatumRowkeyHelper rowkey_helper(scan_allocator);
ObDatumRowkey datum_rowkey;
ObStoreRowkey rowkey;
rowkey.assign(row.cells_, data_table.get_rowkey_column_num());
if (OB_ISNULL(data_tablet)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("tablet is null", K(ret), K(tablet_handle));
} else {
ObSingleRowGetter single_row_getter(*allocator, *data_tablet);
if (OB_FAIL(init_single_row_getter(single_row_getter, run_ctx, out_col_ids, data_table, true))) {
LOG_WARN("failed to init single row getter", K(ret));
} else if (OB_FAIL(rowkey_helper.convert_datum_rowkey(rowkey.get_rowkey(), datum_rowkey))) {
STORAGE_LOG(WARN, "Failed to transfer datum rowkey", K(ret), K(rowkey));
} else if (OB_FAIL(single_get_row(single_row_getter, datum_rowkey, duplicated_rows))) {
LOG_WARN("failed to single get row", K(ret));
}
}
if (OB_FAIL(ret)) {
if (nullptr != duplicated_rows) {
ObQueryIteratorFactory::free_insert_dup_iter(duplicated_rows);
duplicated_rows = nullptr;
}
}
return ret;
}
int ObLSTabletService::init_single_row_getter(
ObSingleRowGetter &row_getter,
ObDMLRunningCtx &run_ctx,
const ObIArray<uint64_t> &out_col_ids,
ObRelativeTable &relative_table,
bool skip_read_lob)
{
int ret = OB_SUCCESS;
if (OB_FAIL(row_getter.init_dml_access_ctx(run_ctx.store_ctx_, run_ctx.dml_param_, skip_read_lob))) {
LOG_WARN("init dml access ctx failed", K(ret));
} else if (OB_FAIL(row_getter.init_dml_access_param(relative_table,
run_ctx.dml_param_, out_col_ids, skip_read_lob))) {
LOG_WARN("init dml access param failed", K(ret));
}
return ret;
}
int ObLSTabletService::single_get_row(
ObSingleRowGetter &row_getter,
const ObDatumRowkey &rowkey,
ObNewRowIterator *&duplicated_rows)
{
int ret = OB_SUCCESS;
ObNewRow *row = nullptr;
if (OB_FAIL(row_getter.open(rowkey))) {
LOG_WARN("init single row getter failed", K(ret));
} else if (OB_FAIL(row_getter.get_next_row(row))) {
if (OB_ITER_END != ret) {
LOG_WARN("get next row from single row getter failed", K(ret));
} else {
ret = OB_SUCCESS;
}
} else if (NULL == duplicated_rows) {
ObValueRowIterator *dup_iter = NULL;
if (OB_ISNULL(dup_iter = ObQueryIteratorFactory::get_insert_dup_iter())) {
ret = OB_ALLOCATE_MEMORY_FAILED;
LOG_WARN("no memory to alloc ObValueRowIterator", K(ret));
} else {
duplicated_rows = dup_iter;
if (OB_FAIL(dup_iter->init(true))) {
LOG_WARN("failed to initialize ObValueRowIterator", K(ret));
}
}
}
if (OB_SUCC(ret) && row != nullptr) {
ObValueRowIterator *dup_iter = static_cast<ObValueRowIterator*>(duplicated_rows);
if (OB_FAIL(dup_iter->add_row(*row))) {
LOG_WARN("failed to store conflict row", K(ret), K(*row));
} else {
LOG_DEBUG("get conflict row", KPC(row));
}
}
return ret;
}
int ObLSTabletService::convert_row_to_rowkey(
ObSingleRowGetter &index_row_getter,
ObStoreRowkey &rowkey)
{
int ret = OB_SUCCESS;
ObNewRow *row = nullptr;
if (OB_FAIL(index_row_getter.get_next_row(row))) {
if (OB_ITER_END != ret) {
LOG_WARN("get next row from index row getter failed", K(ret));
}
} else {
rowkey.assign(row->cells_, row->count_);
}
return ret;
}
/* this func is an encapsulation of ObNewRowIterator->get_next_row.
* 1. need_copy_cells is true, perform a cells copy, but not a deep copy.
* memory for store_row.row_val.cells_ has already allocated before
* this func is invoked, no need to alloc memory in this func.
* 2. need_copy_cells is false, just perform an assignment, no any copy behavior,
*/
int ObLSTabletService::get_next_row_from_iter(
ObNewRowIterator *row_iter,
ObStoreRow &store_row,
const bool need_copy_cells)
{
int ret = OB_SUCCESS;
ObNewRow *row = nullptr;
if (OB_ISNULL(row_iter)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid argument", K(ret), K(row_iter));
} else if (OB_FAIL(row_iter->get_next_row(row))) {
if (OB_ITER_END != ret) {
LOG_WARN("fail to iterate a row", K(ret), K(row));
}
} else {
if (need_copy_cells) {
// in this situation, store_row.row_val has already hold mem for cells_,
// no need to alloc mem here, we copy cells only.
store_row.row_val_.count_ = row->count_;
for (int64_t i = 0; i < row->count_; ++i) {
store_row.row_val_.cells_[i] = row->cells_[i];
}
} else {
store_row.row_val_ = *row;
}
}
return ret;
}
int ObLSTabletService::insert_row_to_tablet(
ObTabletHandle &tablet_handle,
ObDMLRunningCtx &run_ctx,
ObStoreRow &tbl_row)
{
int ret = OB_SUCCESS;
ObStoreCtx &store_ctx = run_ctx.store_ctx_;
ObRelativeTable &relative_table = run_ctx.relative_table_;
if (OB_UNLIKELY(!store_ctx.is_valid()
|| !relative_table.is_valid()
|| nullptr == run_ctx.col_descs_
|| run_ctx.col_descs_->count() <= 0
|| !tbl_row.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(store_ctx), KP(run_ctx.col_descs_), K(tbl_row), K(ret));
} else if (GCONF.enable_defensive_check()
&& OB_FAIL(check_new_row_legitimacy(run_ctx, tbl_row.row_val_))) {
LOG_WARN("check new row legitimacy failed", K(ret), K(tbl_row.row_val_));
} else if (OB_FAIL(insert_lob_tablet_row(tablet_handle, run_ctx, tbl_row))) {
LOG_WARN("failed to write lob tablets rows", K(ret));
} else {
const ObColDescIArray &col_descs = *run_ctx.col_descs_;
if (OB_FAIL(tablet_handle.get_obj()->insert_row_without_rowkey_check(
relative_table,
store_ctx,
col_descs,
tbl_row,
run_ctx.dml_param_.encrypt_meta_))) {
if (OB_TRY_LOCK_ROW_CONFLICT != ret) {
LOG_WARN("failed to write table row", K(ret),
"table id", relative_table.get_table_id(),
K(col_descs), K(tbl_row));
}
}
}
return ret;
}
int ObLSTabletService::process_old_row_lob_col(
ObTabletHandle &data_tablet_handle,
ObDMLRunningCtx &run_ctx,
ObStoreRow &tbl_row)
{
int ret = OB_SUCCESS;
run_ctx.is_old_row_valid_for_lob_ = false;
bool has_lob_col = false;
bool need_reread = is_sys_table(run_ctx.relative_table_.get_table_id());
int64_t col_cnt = run_ctx.col_descs_->count();
if (tbl_row.row_val_.count_ != col_cnt) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("[STORAGE_LOB]Invliad row col cnt", K(ret), K(col_cnt), K(tbl_row));
} else {
for (int64_t i = 0; OB_SUCC(ret) && i < col_cnt; ++i) {
const ObColDesc &column = run_ctx.col_descs_->at(i);
if (is_lob_storage(column.col_type_.get_type())) {
has_lob_col = true;
need_reread = need_reread || !(tbl_row.row_val_.cells_[i].has_lob_header());
break;
}
}
}
if (OB_SUCC(ret) && has_lob_col) {
if (!need_reread) {
for (int64_t i = 0; OB_SUCC(ret) && i < col_cnt; ++i) {
const ObColDesc &column = run_ctx.col_descs_->at(i);
if (is_lob_storage(column.col_type_.get_type())) {
ObObj &obj = tbl_row.row_val_.cells_[i];
bool has_lob_header = obj.has_lob_header();
if (obj.is_null() || obj.is_nop_value()) {
// do nothing
} else if (!has_lob_header) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("lob should have lob locator here.", K(ret), K(i), K(tbl_row.row_val_.cells_[i]));
} else {
ObLobLocatorV2 lob(obj.get_string(), has_lob_header);
ObString disk_loc;
if (!lob.is_valid()) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("invalid lob locator.", K(ret), K(lob));
} else if (lob.is_simple()) {
// do nothing
} else if (OB_FAIL(lob.get_disk_locator(disk_loc))) {
LOG_WARN("failed to get disk lob locator.", K(ret), K(lob));
} else {
obj.set_lob_value(obj.get_type(), disk_loc.ptr(), disk_loc.length());
if (has_lob_header) {
obj.set_has_lob_header();
}
run_ctx.is_old_row_valid_for_lob_ = true;
}
}
}
}
} else {
if (OB_FAIL(table_refresh_row(data_tablet_handle, run_ctx, tbl_row.row_val_))) {
LOG_WARN("[STORAGE_LOB]re-read lob col failed", K(ret));
}
}
}
return ret;
}
int ObLSTabletService::table_refresh_row(
ObTabletHandle &data_tablet_handle,
ObDMLRunningCtx &run_ctx,
ObNewRow &row)
{
int ret = OB_SUCCESS;
ObArenaAllocator scan_allocator(common::ObMemAttr(MTL_ID(), ObModIds::OB_LOB_ACCESS_BUFFER));
ObTablet *data_tablet = data_tablet_handle.get_obj();
ObRelativeTable &data_table = run_ctx.relative_table_;
ObStoreRowkey rowkey;
if (OB_FAIL(rowkey.assign(row.cells_, data_table.get_rowkey_column_num()))) {
LOG_WARN("get rowkey col num failed", K(ret));
}
int64_t col_cnt = run_ctx.col_descs_->count();
ObSEArray<uint64_t, 8> out_col_ids;
for (int i = 0; OB_SUCC(ret) && i < col_cnt; ++i) {
if (OB_FAIL(out_col_ids.push_back(run_ctx.col_descs_->at(i).col_id_))) {
LOG_WARN("push col id failed.", K(ret), K(i));
}
}
ObDatumRowkey datum_rowkey;
ObDatumRowkeyHelper rowkey_helper(scan_allocator);
ObSingleRowGetter single_row_getter(scan_allocator, *data_tablet);
if (OB_FAIL(ret)) {
} else if (OB_FAIL(init_single_row_getter(single_row_getter,
run_ctx, out_col_ids, data_table, true))) {
LOG_WARN("failed to init single row getter", K(ret));
} else if (OB_FAIL(rowkey_helper.convert_datum_rowkey(rowkey.get_rowkey(), datum_rowkey))) {
LOG_WARN("Failed to transfer datum rowkey", K(ret), K(rowkey));
} else {
ObNewRow *new_row = nullptr;
if (OB_FAIL(single_row_getter.open(datum_rowkey))) {
LOG_WARN("init single row getter failed", K(ret));
} else if (OB_FAIL(single_row_getter.get_next_row(new_row))) {
if (ret == OB_ITER_END) {
LOG_DEBUG("re-read old row not exist", K(ret), K(row));
ret = OB_SUCCESS;
} else {
LOG_WARN("get next row from single row getter failed", K(ret));
}
} else if (OB_ISNULL(new_row)) {
ret = OB_ERR_NULL_VALUE;
LOG_WARN("get next row from single row null", K(ret));
} else if (new_row->get_count() != row.get_count()) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("get row from single row col count not equal.", K(ret), K(row.get_count()), K(new_row->get_count()));
} else {
LOG_DEBUG("get new row success.", K(row), KPC(new_row));
// only write cells, not write row
// passing fixed double scale from row to new_row
for (int64_t i = 0; OB_SUCC(ret) && i < new_row->get_count(); ++i) {
if (row.cells_[i].is_fixed_double()) {
new_row->cells_[i].set_scale(row.cells_[i].get_scale());
} else if (OB_FAIL(ob_write_obj(run_ctx.lob_allocator_, new_row->cells_[i], row.cells_[i]))) {
LOG_WARN("copy ObObj error", K(ret), K(i), K(new_row->cells_[i]));
}
}
if (OB_SUCC(ret)) {
run_ctx.is_old_row_valid_for_lob_ = true;
}
}
}
return ret;
}
int ObLSTabletService::delete_row_in_tablet(
ObTabletHandle &tablet_handle,
ObDMLRunningCtx &run_ctx,
const ObNewRow &row)
{
int ret = OB_SUCCESS;
const ObDMLBaseParam &dml_param = run_ctx.dml_param_;
ObStoreCtx &ctx = run_ctx.store_ctx_;
ObRelativeTable &relative_table = run_ctx.relative_table_;
ObStoreRow &tbl_row = run_ctx.tbl_row_;
ObStoreRow new_tbl_row;
ObSEArray<int64_t, 8> update_idx; // update_idx is a dummy param here
tbl_row.flag_.set_flag(ObDmlFlag::DF_DELETE);
tbl_row.row_val_ = row;
if (OB_FAIL(check_old_row_legitimacy(tablet_handle, run_ctx, row))) {
if (OB_ERR_DEFENSIVE_CHECK == ret) {
dump_diag_info_for_old_row_loss(relative_table, ctx, tbl_row);
}
LOG_WARN("check old row legitimacy failed", K(row));
} else if (OB_FAIL(process_old_row_lob_col(tablet_handle, run_ctx, tbl_row))) {
LOG_WARN("failed to process old row lob col", K(ret), K(tbl_row));
} else if (OB_FAIL(delete_lob_tablet_rows(run_ctx, tablet_handle, tbl_row, row))) {
LOG_WARN("failed to delete lob rows.", K(ret), K(tbl_row), K(row));
} else if (!dml_param.is_total_quantity_log_) {
if (OB_FAIL(tablet_handle.get_obj()->insert_row_without_rowkey_check(relative_table,
ctx, *run_ctx.col_descs_, tbl_row, dml_param.encrypt_meta_))) {
if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) {
LOG_WARN("failed to set row", K(ret), K(*run_ctx.col_descs_), K(tbl_row));
}
}
} else {
update_idx.reset(); // update_idx is a dummy param here
new_tbl_row.reset();
new_tbl_row.flag_.set_flag(ObDmlFlag::DF_DELETE);
new_tbl_row.row_val_ = tbl_row.row_val_;
tbl_row.flag_.set_flag(ObDmlFlag::DF_UPDATE);
if (OB_FAIL(tablet_handle.get_obj()->update_row(relative_table, ctx,
*run_ctx.col_descs_, update_idx, tbl_row, new_tbl_row, dml_param.encrypt_meta_))) {
if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) {
LOG_WARN("failed to set row", K(ret), K(*run_ctx.col_descs_), K(tbl_row), K(new_tbl_row));
}
} else {
LOG_DEBUG("succeeded to del main table row", K(tbl_row), K(new_tbl_row));
}
}
return ret;
}
int ObLSTabletService::delete_lob_col(
ObDMLRunningCtx &run_ctx,
const ObColDesc &column,
ObObj &obj,
const ObObj &sql_obj,
ObLobCommon *&lob_common,
ObLobAccessParam &lob_param)
{
int ret = OB_SUCCESS;
ObLobManager *lob_mngr = MTL(ObLobManager*);
if (OB_ISNULL(lob_mngr)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("[STORAGE_LOB]get lob manager instance failed.", K(ret));
} else if (!column.col_type_.is_lob_storage() || obj.is_nop_value() || obj.is_null() ||
!run_ctx.is_old_row_valid_for_lob_) {
// do nothing
} else {
ObString data = obj.get_string();
// Notice: Only disk locator here!
ObString sql_data = sql_obj.get_string();
if (data.length() < sizeof(ObLobCommon)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("[STORAGE_LOB]Invalid Lob data.", K(ret), K(obj), K(data));
} else {
void *buf = run_ctx.lob_allocator_.alloc(data.length());
if (OB_ISNULL(buf)) {
ret = OB_ALLOCATE_MEMORY_FAILED;
LOG_WARN("failed to deep copy lob data.", K(ret), K(data));
} else {
MEMCPY(buf, data.ptr(), data.length());
lob_common = reinterpret_cast<ObLobCommon*>(buf);
lob_param.tx_desc_ = run_ctx.store_ctx_.mvcc_acc_ctx_.tx_desc_;
lob_param.parent_seq_no_ = run_ctx.store_ctx_.mvcc_acc_ctx_.tx_scn_;
lob_param.snapshot_ = run_ctx.dml_param_.snapshot_;
lob_param.tx_id_ = lob_param.tx_desc_->get_tx_id();
lob_param.sql_mode_ = run_ctx.dml_param_.sql_mode_;
lob_param.is_total_quantity_log_ = run_ctx.dml_param_.is_total_quantity_log_;
lob_param.ls_id_ = run_ctx.store_ctx_.ls_id_;
lob_param.tablet_id_ = run_ctx.relative_table_.get_tablet_id();
lob_param.coll_type_ = column.col_type_.get_collation_type();
lob_param.allocator_ = &run_ctx.lob_allocator_;
lob_param.lob_common_ = lob_common;
lob_param.handle_size_ = data.length();
lob_param.byte_size_ = lob_param.lob_common_->get_byte_size(data.length());
lob_param.timeout_ = run_ctx.dml_param_.timeout_;
lob_param.scan_backward_ = false;
lob_param.offset_ = 0;
// use byte size to delete all
lob_param.len_ = lob_param.byte_size_; //ObCharset::strlen_char(lob_param.coll_type_, sql_data.ptr(), sql_data.length());
if (lob_param.byte_size_ < 0) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("calc byte size is negative.", K(ret), K(data), K(lob_param));
} else if (OB_FAIL(lob_mngr->erase(lob_param))) {
LOG_WARN("[STORAGE_LOB]lob erase failed.", K(ret), K(lob_param));
}
}
}
}
return ret;
}
int ObLSTabletService::delete_lob_tablet_rows(
ObDMLRunningCtx &run_ctx,
ObTabletHandle &data_tablet,
ObStoreRow &tbl_row,
const ObNewRow &row)
{
int ret = OB_SUCCESS;
int64_t col_cnt = run_ctx.col_descs_->count();
if (tbl_row.row_val_.count_ != col_cnt) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("[STORAGE_LOB]Invliad row col cnt", K(col_cnt), K(tbl_row));
} else {
ObLobCommon *lob_common = nullptr;
for (int64_t i = 0; OB_SUCC(ret) && i < col_cnt; ++i) {
const ObColDesc &column = run_ctx.col_descs_->at(i);
if (column.col_type_.is_lob_storage()) {
ObObj &obj = tbl_row.row_val_.get_cell(i);
const ObObj &sql_obj = row.get_cell(i);
ObLobAccessParam lob_param;
if (OB_FAIL(delete_lob_col(run_ctx, column, obj, sql_obj, lob_common, lob_param))) {
LOG_WARN("[STORAGE_LOB]failed to erase lob col.", K(ret), K(i), K(tbl_row));
}
}
}
}
return ret;
}
int ObLSTabletService::prepare_scan_table_param(
ObTableScanParam &param,
share::schema::ObMultiVersionSchemaService &schema_service)
{
int ret = OB_SUCCESS;
if (NULL == param.table_param_ || OB_INVALID_ID == param.table_param_->get_table_id()) {
void *buf = NULL;
ObTableParam *table_param = NULL;
ObSchemaGetterGuard schema_guard;
const ObTableSchema *table_schema = NULL;
const uint64_t tenant_id = MTL_ID();
const bool check_formal = param.index_id_ > OB_MAX_CORE_TABLE_ID;
if (OB_FAIL(schema_service.get_tenant_schema_guard(tenant_id, schema_guard))) {
LOG_WARN("failed to get schema manager", K(ret), K(tenant_id));
} else if (check_formal && OB_FAIL(schema_guard.check_formal_guard())) {
LOG_WARN("Fail to check formal schema, ", K(param.index_id_), K(ret));
} else if (OB_FAIL(schema_guard.get_table_schema(tenant_id,
param.index_id_, table_schema))) {
LOG_WARN("Fail to get table schema", K(param.index_id_), K(ret));
} else if (NULL == table_schema) {
ret = OB_TABLE_NOT_EXIST;
LOG_WARN("table not exist", K(param.index_id_), K(ret));
} else {
if (NULL == (buf = param.allocator_->alloc(sizeof(ObTableParam)))) {
ret = OB_ALLOCATE_MEMORY_FAILED;
LOG_WARN("Fail to allocate memory, ", K(ret));
} else {
//TODO table param should not generate twice!!!!
table_param = new (buf) ObTableParam(*param.allocator_);
table_param->get_enable_lob_locator_v2() = (!IS_CLUSTER_VERSION_BEFORE_4_1_0_0);
if (OB_FAIL(table_param->convert(*table_schema, param.column_ids_, param.pd_storage_flag_))) {
LOG_WARN("Fail to convert table param, ", K(ret));
} else {
param.table_param_ = table_param;
}
}
}
}
return ret;
}
void ObLSTabletService::dump_diag_info_for_old_row_loss(
ObRelativeTable &data_table,
ObStoreCtx &store_ctx,
const ObStoreRow &tbl_row)
{
int ret = OB_SUCCESS;
ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "DumpDIAGInfo"));
ObTableAccessParam access_param;
ObTableAccessContext access_ctx;
ObSEArray<int32_t, 16> out_col_pros;
ObStoreRowkey rowkey;
ObDatumRowkey datum_rowkey;
ObDatumRowkeyHelper rowkey_helper(allocator);
const int64_t schema_rowkey_cnt = data_table.get_rowkey_column_num();
ObTableStoreIterator &table_iter = *data_table.tablet_iter_.table_iter();
ObQueryFlag query_flag(ObQueryFlag::Forward,
false, /*is daily merge scan*/
false, /*is read multiple macro block*/
false, /*sys task scan, read one macro block in single io*/
false /*is full row scan?*/,
false,
false);
common::ObVersionRange trans_version_rang;
trans_version_rang.base_version_ = 0;
trans_version_rang.multi_version_start_ = 0;
trans_version_rang.snapshot_version_ = store_ctx.mvcc_acc_ctx_.get_snapshot_version().get_val_for_tx();
const share::schema::ObTableSchemaParam *schema_param = data_table.get_schema_param();
const ObITableReadInfo *read_info = &schema_param->get_read_info();
for (int64_t i = 0; OB_SUCC(ret) && i < read_info->get_request_count(); i++) {
if (OB_FAIL(out_col_pros.push_back(i))) {
STORAGE_LOG(WARN, "Failed to push back col project", K(ret), K(i));
}
}
if (OB_FAIL(ret)) {
} else if (OB_FAIL(rowkey.assign(tbl_row.row_val_.cells_, schema_rowkey_cnt))) {
LOG_WARN("Failed to assign rowkey", K(ret));
} else if (OB_FAIL(rowkey_helper.convert_datum_rowkey(rowkey.get_rowkey(), datum_rowkey))) {
STORAGE_LOG(WARN, "Failed to transfer datum rowkey", K(ret), K(rowkey));
} else if (OB_FAIL(access_ctx.init(query_flag, store_ctx, allocator, trans_version_rang))) {
LOG_WARN("Fail to init access ctx", K(ret));
} else {
access_param.is_inited_ = true;
access_param.iter_param_.table_id_ = data_table.get_table_id();
access_param.iter_param_.tablet_id_ = data_table.tablet_iter_.get_tablet()->get_tablet_meta().tablet_id_;
access_param.iter_param_.read_info_ = read_info;
access_param.iter_param_.out_cols_project_ = &out_col_pros;
ObStoreRowIterator *getter = nullptr;
ObITable *table = nullptr;
const ObDatumRow *row = nullptr;
FLOG_INFO("Try to find the specified rowkey within all the sstable", K(tbl_row), K(table_iter));
FLOG_INFO("Prepare the diag env to dump the rows", K(store_ctx), K(rowkey), K(datum_rowkey),
K(access_ctx.trans_version_range_));
table_iter.resume();
while (OB_SUCC(ret)) {
if (OB_FAIL(table_iter.get_next(table))) {
if (OB_ITER_END != ret) {
LOG_WARN("failed to get next tables", K(ret));
}
} else if (OB_ISNULL(table)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("table must not be null", K(ret), K(table_iter));
} else if (OB_FAIL(table->get(access_param.iter_param_, access_ctx, datum_rowkey, getter))) {
LOG_WARN("Failed to get param", K(ret), KPC(table));
} else if (OB_FAIL(getter->get_next_row(row))) {
LOG_WARN("Failed to get next row", K(ret), KPC(table));
} else if (row->row_flag_.is_not_exist() || row->row_flag_.is_delete()){
FLOG_INFO("Cannot found rowkey in the table", KPC(row), KPC(table));
} else if (table->is_sstable()) {
FLOG_INFO("Found rowkey in the sstable",
KPC(row), KPC(reinterpret_cast<ObSSTable*>(table)));
} else {
FLOG_INFO("Found rowkey in the memtable",
KPC(row), KPC(reinterpret_cast<memtable::ObMemtable*>(table)));
}
// ignore error in the loop
if (OB_FAIL(ret) && OB_ITER_END != ret) {
ret = OB_SUCCESS;
}
if (OB_NOT_NULL(getter)) {
getter->~ObStoreRowIterator();
getter = nullptr;
}
}
if (OB_ITER_END == ret) {
ret = OB_SUCCESS;
}
if (OB_SUCC(ret)) {
FLOG_INFO("prepare to use single merge to find row", K(rowkey), K(datum_rowkey), K(access_param));
ObSingleMerge *get_merge = nullptr;
ObGetTableParam get_table_param;
ObDatumRow *row = nullptr;
get_table_param.tablet_iter_ = data_table.tablet_iter_;
void *buf = nullptr;
if (OB_ISNULL(buf = allocator.alloc(sizeof(ObSingleMerge)))) {
ret = OB_ALLOCATE_MEMORY_FAILED;
LOG_WARN("Failed to alloc memory for single merge", K(ret));
} else if (FALSE_IT(get_merge = new(buf)ObSingleMerge())) {
} else if (OB_FAIL(get_merge->init(access_param, access_ctx, get_table_param))) {
LOG_WARN("Failed to init single get merge", K(ret));
} else if (OB_FAIL(get_merge->open(datum_rowkey))) {
LOG_WARN("Failed to open single merge", K(ret));
} else if (FALSE_IT(get_merge->disable_fill_default())) {
} else {
while (OB_SUCC(get_merge->get_next_row(row))) {
FLOG_INFO("Found one row for the rowkey", KPC(row));
}
FLOG_INFO("Finish to find rowkey with single merge", K(ret), K(rowkey), K(datum_rowkey));
}
if (OB_NOT_NULL(get_merge)) {
get_merge->~ObSingleMerge();
get_merge = nullptr;
}
}
#ifdef ENABLE_DEBUG_LOG
// print single row check info
if (store_ctx.mvcc_acc_ctx_.tx_id_.is_valid()) {
transaction::ObTransService *trx = MTL(transaction::ObTransService *);
if (OB_NOT_NULL(trx)
&& NULL != trx->get_defensive_check_mgr()) {
(void)trx->get_defensive_check_mgr()->dump(store_ctx.mvcc_acc_ctx_.tx_id_);
}
}
#endif
}
}
int ObLSTabletService::prepare_dml_running_ctx(
const common::ObIArray<uint64_t> *column_ids,
const common::ObIArray<uint64_t> *upd_col_ids,
ObTabletHandle &tablet_handle,
ObDMLRunningCtx &run_ctx)
{
int ret = OB_SUCCESS;
if (OB_FAIL(run_ctx.init(
column_ids,
upd_col_ids,
MTL(ObTenantSchemaService*)->get_schema_service(),
tablet_handle))) {
LOG_WARN("failed to init run ctx", K(ret));
}
return ret;
}
int ObLSTabletService::get_ls_min_end_scn(
SCN &min_end_scn_from_latest_tablets, SCN &min_end_scn_from_old_tablets)
{
int ret = OB_SUCCESS;
const ObLSID &ls_id = ls_->get_ls_id();
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
ObSArray<ObTabletID> tablet_ids;
GetAllTabletIDOperator op(tablet_ids, true/*except_ls_inner_tablet*/);
min_end_scn_from_latest_tablets.set_max();
min_end_scn_from_old_tablets.set_max();
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_FAIL(tablet_id_set_.foreach(op))) {
STORAGE_LOG(WARN, "fail to get all tablet ids from set", K(ret));
} else {
SCN ls_checkpoint = ls_->get_clog_checkpoint_scn();
for (int64_t i = 0; OB_SUCC(ret) && i < tablet_ids.count(); ++i) {
ObTabletMapKey key(ls_id, tablet_ids.at(i));
SCN min_end_scn_from_latest = SCN::max_scn();
SCN min_end_scn_from_old = SCN::max_scn();
if (OB_FAIL(t3m->get_min_end_scn_for_ls(key,
ls_checkpoint,
min_end_scn_from_latest,
min_end_scn_from_old))) {
if (OB_ENTRY_NOT_EXIST != ret) {
LOG_WARN("fail to get min end scn", K(ret), K(key));
} else {
ret = OB_SUCCESS;
}
} else {
if (min_end_scn_from_latest < min_end_scn_from_latest_tablets) {
LOG_DEBUG("update", K(key), K(min_end_scn_from_latest_tablets), K(min_end_scn_from_latest));
min_end_scn_from_latest_tablets = min_end_scn_from_latest;
}
if (min_end_scn_from_old < min_end_scn_from_old_tablets) {
LOG_DEBUG("update", K(key), K(min_end_scn_from_old_tablets), K(min_end_scn_from_old));
min_end_scn_from_old_tablets = min_end_scn_from_old;
}
}
}
LOG_INFO("get ls min end scn finish", K(ls_checkpoint));
}
return ret;
}
int ObLSTabletService::get_multi_ranges_cost(
const ObTabletID &tablet_id,
const common::ObIArray<common::ObStoreRange> &ranges,
int64_t &total_size)
{
int ret = OB_SUCCESS;
ObTabletTableIterator iter;
const int64_t max_snapshot_version = INT64_MAX;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret));
} else if (OB_FAIL(get_read_tables(tablet_id, max_snapshot_version, iter))) {
LOG_WARN("fail to get all read tables", K(ret), K(tablet_id), K(max_snapshot_version));
} else {
ObPartitionMultiRangeSpliter spliter;
if (OB_FAIL(spliter.get_multi_range_size(
ranges,
iter.get_tablet()->get_rowkey_read_info(),
*iter.table_iter(),
total_size))) {
LOG_WARN("fail to get multi ranges cost", K(ret), K(ranges));
}
}
return ret;
}
int ObLSTabletService::split_multi_ranges(
const ObTabletID &tablet_id,
const ObIArray<ObStoreRange> &ranges,
const int64_t expected_task_count,
common::ObIAllocator &allocator,
ObArrayArray<ObStoreRange> &multi_range_split_array)
{
int ret = OB_SUCCESS;
ObTabletTableIterator iter;
const int64_t max_snapshot_version = INT64_MAX;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret));
} else if (OB_FAIL(get_read_tables(tablet_id, max_snapshot_version, iter))) {
LOG_WARN("fail to get all read tables", K(ret), K(tablet_id), K(max_snapshot_version));
} else {
ObPartitionMultiRangeSpliter spliter;
if (OB_FAIL(spliter.get_split_multi_ranges(
ranges,
expected_task_count,
iter.get_tablet()->get_rowkey_read_info(),
*iter.table_iter(),
allocator,
multi_range_split_array))) {
LOG_WARN("fail to get splitted ranges", K(ret), K(ranges), K(expected_task_count));
}
}
return ret;
}
int ObLSTabletService::estimate_row_count(
const ObTableScanParam &param,
const ObTableScanRange &scan_range,
ObIArray<ObEstRowCountRecord> &est_records,
int64_t &logical_row_count,
int64_t &physical_row_count)
{
int ret = OB_SUCCESS;
ObPartitionEst batch_est;
ObTabletTableIterator tablet_iter;
common::ObSEArray<ObITable*, 4> tables;
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!param.is_estimate_valid() || !scan_range.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid argument", K(ret), K(param), K(scan_range));
} else if (scan_range.is_empty()) {
} else {
const int64_t snapshot_version = -1 == param.frozen_version_ ?
GET_BATCH_ROWS_READ_SNAPSHOT_VERSION : param.frozen_version_;
if (OB_FAIL(get_read_tables(param.tablet_id_, snapshot_version, tablet_iter, false))) {
if (OB_TABLET_NOT_EXIST != ret) {
LOG_WARN("failed to get tablet_iter", K(ret), K(snapshot_version), K(param));
}
} else {
while(OB_SUCC(ret)) {
ObITable *table = nullptr;
if (OB_FAIL(tablet_iter.table_iter()->get_next(table))) {
if (OB_ITER_END != ret) {
LOG_WARN("failed to get next table", K(ret), K(tablet_iter.table_iter()));
} else {
ret = OB_SUCCESS;
break;
}
} else if (OB_ISNULL(table)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("table shoud not be null", K(ret), K(tablet_iter.table_iter()));
} else if (table->is_sstable() && static_cast<ObSSTable*>(table)->is_empty()) {
LOG_DEBUG("cur sstable is empty", K(ret), K(*table));
continue;
}
if (OB_SUCC(ret) && OB_FAIL(tables.push_back(table))) {
LOG_WARN("failed to push back table", K(ret), K(tables));
}
}
}
if (OB_SUCC(ret) && tables.count() > 0) {
ObTableEstimateBaseInput base_input(param.scan_flag_, param.index_id_, param.tx_id_, tables, tablet_iter.get_tablet_handle());
if (scan_range.is_get()) {
if (OB_FAIL(ObTableEstimator::estimate_row_count_for_get(base_input, scan_range.get_rowkeys(), batch_est))) {
LOG_WARN("failed to estimate row count", K(ret), K(param), K(scan_range));
}
} else if (OB_FAIL(ObTableEstimator::estimate_row_count_for_scan(base_input, scan_range.get_ranges(), batch_est, est_records))) {
LOG_WARN("failed to estimate row count", K(ret), K(param), K(scan_range));
}
}
}
if (OB_SUCC(ret)) {
logical_row_count = batch_est.logical_row_count_;
physical_row_count = batch_est.physical_row_count_;
}
LOG_DEBUG("estimate result", K(ret), K(batch_est), K(est_records));
return ret;
}
int ObLSTabletService::estimate_block_count_and_row_count(
const common::ObTabletID &tablet_id,
int64_t &macro_block_count,
int64_t &micro_block_count,
int64_t &sstable_row_count,
int64_t &memtable_row_count,
common::ObIArray<int64_t> &cg_macro_cnt_arr,
common::ObIArray<int64_t> &cg_micro_cnt_arr)
{
int ret = OB_SUCCESS;
macro_block_count = 0;
micro_block_count = 0;
sstable_row_count = 0;
memtable_row_count = 0;
ObTabletTableIterator tablet_iter;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_FAIL(get_read_tables(tablet_id, INT64_MAX, tablet_iter, false/*allow_no_ready_read*/))) {
LOG_WARN("failed to get read tables", K(ret));
}
ObITable *table = nullptr;
ObSSTable *sstable = nullptr;
cg_macro_cnt_arr.reset();
cg_micro_cnt_arr.reset();
while (OB_SUCC(ret)) {
ObSSTableMetaHandle sst_meta_hdl;
if (OB_FAIL(tablet_iter.table_iter()->get_next(table))) {
if (OB_ITER_END != ret) {
LOG_WARN("failed to get next tables", K(ret));
} else {
ret = OB_SUCCESS;
break;
}
} else if (OB_ISNULL(table)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("get unexpected null table", K(ret), K(tablet_iter.table_iter()));
} else if (table->is_memtable()) {
memtable_row_count += static_cast<memtable::ObMemtable *>(table)->get_physical_row_cnt();
} else if (table->is_sstable()) {
sstable = static_cast<ObSSTable *>(table);
if (OB_FAIL(sstable->get_meta(sst_meta_hdl))) {
LOG_WARN("fail to get sstable meta handle", K(ret));
} else {
sstable = static_cast<ObSSTable *>(table);
macro_block_count += sstable->get_data_macro_block_count();
micro_block_count += sst_meta_hdl.get_sstable_meta().get_data_micro_block_count();
sstable_row_count += sst_meta_hdl.get_sstable_meta().get_row_count();
}
}
if (OB_SUCC(ret) && table->is_co_sstable()) {
ObCOSSTableV2 *co_sstable = static_cast<ObCOSSTableV2 *>(table);
common::ObArray<ObITable *> tables;
if (OB_FAIL(co_sstable->get_all_tables(tables))) {
LOG_WARN("fail to get all tables", K(ret), KPC(co_sstable));
} else {
for (int64_t i = 0; OB_SUCC(ret) && i < tables.count(); i++) {
ObITable *cg_table = tables.at(i);
ObSSTableMetaHandle co_sst_meta_hdl;
if (OB_UNLIKELY(cg_table == nullptr || !cg_table->is_sstable())) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("unexpected cg table", K(ret), KPC(cg_table));
} else if (FALSE_IT(sstable = static_cast<ObSSTable *>(cg_table))) {
} else if (OB_FAIL(sstable->get_meta(co_sst_meta_hdl))) {
LOG_WARN("fail to get sstable meta handle", K(ret));
} else if (OB_FAIL(cg_macro_cnt_arr.push_back(sstable->get_data_macro_block_count()))) {
LOG_WARN("fail to push macro count", K(ret));
} else if (OB_FAIL(cg_micro_cnt_arr.push_back(co_sst_meta_hdl.get_sstable_meta().get_data_micro_block_count()))) {
LOG_WARN("fail to push micro count", K(ret));
}
}
}
}
}
return ret;
}
int ObLSTabletService::get_tx_data_memtable_mgr(ObMemtableMgrHandle &mgr_handle)
{
mgr_handle.reset();
return mgr_handle.set_memtable_mgr(&tx_data_memtable_mgr_);
}
int ObLSTabletService::get_tx_ctx_memtable_mgr(ObMemtableMgrHandle &mgr_handle)
{
mgr_handle.reset();
return mgr_handle.set_memtable_mgr(&tx_ctx_memtable_mgr_);
}
int ObLSTabletService::get_lock_memtable_mgr(ObMemtableMgrHandle &mgr_handle)
{
mgr_handle.reset();
return mgr_handle.set_memtable_mgr(&lock_memtable_mgr_);
}
int ObLSTabletService::get_mds_table_mgr(mds::MdsTableMgrHandle &mgr_handle)
{
mgr_handle.reset();
return mgr_handle.set_mds_table_mgr(&mds_table_mgr_);
}
int ObLSTabletService::create_ls_inner_tablet(
const share::ObLSID &ls_id,
const common::ObTabletID &tablet_id,
const SCN &major_frozen_scn,
const share::schema::ObTableSchema &table_schema,
const lib::Worker::CompatMode &compat_mode,
const SCN &create_scn)
{
int ret = OB_SUCCESS;
bool b_exist = false;
ObTabletHandle tablet_handle;
common::ObTabletID empty_tablet_id;
ObMetaDiskAddr disk_addr;
const int64_t snapshot_version = major_frozen_scn.get_val_for_tx();
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!ls_id.is_valid())
|| OB_UNLIKELY(!tablet_id.is_valid())
|| OB_UNLIKELY(!major_frozen_scn.is_valid())
|| OB_UNLIKELY(!table_schema.is_valid())
|| OB_UNLIKELY(lib::Worker::CompatMode::INVALID == compat_mode)
|| OB_UNLIKELY(!create_scn.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(ls_id), K(tablet_id), K(major_frozen_scn),
K(table_schema), K(compat_mode), K(create_scn));
} else if (OB_UNLIKELY(ls_id != ls_->get_ls_id())) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("ls id is unexpected", K(ret), "arg_ls_id", ls_id, "ls_id", ls_->get_ls_id());
} else if (OB_UNLIKELY(!tablet_id.is_ls_inner_tablet())) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("tablet id is not ls inner tablet", K(ret), K(tablet_id));
} else if (OB_FAIL(has_tablet(ls_id, tablet_id, b_exist))) {
LOG_WARN("failed to check tablet existence", K(ret), K(ls_id), K(tablet_id));
} else if (OB_UNLIKELY(b_exist)) {
ret = OB_TABLET_EXIST;
LOG_WARN("tablet already exists", K(ret), K(ls_id), K(tablet_id));
} else if (OB_FAIL(create_inner_tablet(ls_id, tablet_id, tablet_id/*data_tablet_id*/,
create_scn, snapshot_version, table_schema, compat_mode, tablet_handle))) {
LOG_WARN("failed to do create tablet", K(ret), K(ls_id), K(tablet_id),
K(create_scn), K(major_frozen_scn), K(table_schema), K(compat_mode));
}
return ret;
}
int ObLSTabletService::remove_ls_inner_tablet(
const share::ObLSID &ls_id,
const common::ObTabletID &tablet_id)
{
int ret = OB_SUCCESS;
common::ObSEArray<common::ObTabletID, 1> tablet_id_array;
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else if (OB_UNLIKELY(!ls_id.is_valid())
|| OB_UNLIKELY(!tablet_id.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid args", K(ret), K(ls_id), K(tablet_id));
} else if (OB_UNLIKELY(ls_id != ls_->get_ls_id())) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("ls id is unexpected", K(ret), "arg_ls_id", ls_id, "ls_id", ls_->get_ls_id());
} else if (OB_FAIL(do_remove_tablet(ObTabletMapKey(ls_id, tablet_id)))) {
LOG_WARN("failed to remove tablet", K(ret), K(ls_id), K(tablet_id));
}
return ret;
}
int ObLSTabletService::build_tablet_iter(ObLSTabletIterator &iter, const bool except_ls_inner_tablet)
{
int ret = common::OB_SUCCESS;
GetAllTabletIDOperator op(iter.tablet_ids_, except_ls_inner_tablet);
iter.ls_tablet_service_ = this;
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
STORAGE_LOG(WARN, "not inited", K(ret), K_(is_inited));
} else if (OB_FAIL(tablet_id_set_.foreach(op))) {
STORAGE_LOG(WARN, "fail to get all tablet ids from set", K(ret));
} else if (OB_UNLIKELY(!iter.is_valid())) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("iter is invalid", K(ret), K(iter));
}
if (OB_FAIL(ret)) {
iter.reset();
}
return ret;
}
int ObLSTabletService::build_tablet_iter(ObHALSTabletIDIterator &iter)
{
int ret = common::OB_SUCCESS;
GetAllTabletIDOperator op(iter.tablet_ids_);
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
STORAGE_LOG(WARN, "not inited", K(ret), K_(is_inited));
} else if (OB_FAIL(tablet_id_set_.foreach(op))) {
STORAGE_LOG(WARN, "fail to get all tablet ids from set", K(ret));
} else if (OB_UNLIKELY(!iter.is_valid())) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("iter is invalid", K(ret), K(iter));
}
if (OB_FAIL(ret)) {
iter.reset();
}
return ret;
}
int ObLSTabletService::build_tablet_iter(ObHALSTabletIterator &iter)
{
int ret = common::OB_SUCCESS;
iter.ls_tablet_service_ = this;
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
STORAGE_LOG(WARN, "not inited", K(ret), K_(is_inited));
} else if (OB_FAIL(build_tablet_iter(iter.tablet_id_iter_))) {
STORAGE_LOG(WARN, "fail to build ha tablet id iterator", K(ret));
}
if (OB_FAIL(ret)) {
iter.reset();
}
return ret;
}
int ObLSTabletService::set_allow_to_read_(ObLS *ls)
{
int ret = OB_SUCCESS;
ObMigrationStatus migration_status = ObMigrationStatus::OB_MIGRATION_STATUS_MAX;
share::ObLSRestoreStatus restore_status;
if (OB_ISNULL(ls)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("set allow to read get invalid argument", K(ret), KP(ls));
} else {
if (OB_FAIL(ls->get_migration_and_restore_status(migration_status, restore_status))) {
LOG_WARN("failed to get ls migration and restore status", K(ret), KPC(ls));
} else if ((ObMigrationStatus::OB_MIGRATION_STATUS_NONE != migration_status
&& ObMigrationStatus::OB_MIGRATION_STATUS_HOLD != migration_status)
|| ObLSRestoreStatus::RESTORE_NONE != restore_status) {
allow_to_read_mgr_.disable_to_read();
FLOG_INFO("set ls do not allow to read", KPC(ls), K(migration_status), K(restore_status));
} else {
allow_to_read_mgr_.enable_to_read();
}
}
return ret;
}
void ObLSTabletService::enable_to_read()
{
allow_to_read_mgr_.enable_to_read();
}
void ObLSTabletService::disable_to_read()
{
allow_to_read_mgr_.disable_to_read();
}
int ObLSTabletService::GetAllTabletIDOperator::operator()(const common::ObTabletID &tablet_id)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(!tablet_id.is_valid())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid arguments", K(ret), K(tablet_id));
} else if (except_ls_inner_tablet_ && tablet_id.is_ls_inner_tablet()) {
// do nothing
} else if (OB_FAIL(tablet_ids_.push_back(tablet_id))) {
LOG_WARN("failed to push back tablet id", K(ret), K(tablet_id));
}
return ret;
}
int ObLSTabletService::DestroyMemtableAndMemberAndMdsTableOperator::operator()(const common::ObTabletID &tablet_id)
{
int ret = OB_SUCCESS;
ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*);
cur_tablet_id_ = tablet_id;
if (OB_UNLIKELY(!tablet_id.is_valid()) || OB_ISNULL(tablet_svr_)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid arguments", K(ret), K(tablet_id), K(tablet_svr_));
} else if (OB_ISNULL(tablet_svr_->ls_)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("ls is null", K(ret));
} else {
const ObTabletMapKey key(tablet_svr_->ls_->get_ls_id(), tablet_id);
if (OB_FAIL(t3m->release_memtable_and_mds_table_for_ls_offline(key))) {
LOG_WARN("failed to release memtables and mds table", K(ret), K(key));
}
}
return ret;
}
int ObLSTabletService::SetMemtableFrozenOperator::operator()(const common::ObTabletID &tablet_id)
{
int ret = OB_SUCCESS;
ObTabletHandle handle;
cur_tablet_id_ = tablet_id;
if (OB_UNLIKELY(!tablet_id.is_valid()) || OB_ISNULL(tablet_svr_)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid arguments", K(ret), K(tablet_id), K(tablet_svr_));
} else if (OB_FAIL(tablet_svr_->get_tablet(tablet_id,
handle,
ObTabletCommon::DEFAULT_GET_TABLET_NO_WAIT,
ObMDSGetTabletMode::READ_WITHOUT_CHECK))) {
if (OB_TABLET_NOT_EXIST == ret) {
LOG_WARN("failed to get tablet, skip set memtable frozen", K(ret), K(tablet_id));
ret = OB_SUCCESS;
} else {
LOG_ERROR("failed to get tablet", K(ret), K(tablet_id));
}
} else if (OB_FAIL(handle.get_obj()->set_frozen_for_all_memtables())) {
LOG_WARN("failed to set frozen for all memtables", K(ret), K(tablet_id));
}
return ret;
}
void ObLSTabletService::AllowToReadMgr::disable_to_read()
{
AllowToReadInfo read_info;
AllowToReadInfo next_read_info;
do {
LOAD128(read_info, &read_info_);
if (!read_info.allow_to_read()) {
break;
} else {
next_read_info.info_.allow_to_read_ = 0;
next_read_info.info_.seq_ = read_info.info_.seq_ + 1;
}
} while (!CAS128(&read_info_, read_info, next_read_info));
}
void ObLSTabletService::AllowToReadMgr::enable_to_read()
{
AllowToReadInfo read_info;
AllowToReadInfo next_read_info;
do {
LOAD128(read_info, &read_info_);
if (read_info.allow_to_read()) {
break;
} else {
next_read_info.info_.allow_to_read_ = 1;
next_read_info.info_.seq_ = read_info.info_.seq_;
}
} while (!CAS128(&read_info_, read_info, next_read_info));
}
void ObLSTabletService::AllowToReadMgr::load_allow_to_read_info(
AllowToReadInfo &read_info)
{
LOAD128(read_info, &read_info_);
}
void ObLSTabletService::AllowToReadMgr::check_read_info_same(
const AllowToReadInfo &read_info, bool &is_same)
{
AllowToReadInfo current_read_info;
LOAD128(current_read_info, &read_info_);
is_same = read_info == current_read_info;
}
int ObLSTabletService::get_all_tablet_ids(
const bool except_ls_inner_tablet,
common::ObIArray<ObTabletID> &tablet_id_array)
{
int ret = OB_SUCCESS;
GetAllTabletIDOperator op(tablet_id_array, except_ls_inner_tablet);
if (OB_FAIL(tablet_id_set_.foreach(op))) {
LOG_WARN("failed to traverse tablet id set", K(ret));
}
return ret;
}
int ObLSTabletService::flush_mds_table(int64_t recycle_scn)
{
int ret = OB_SUCCESS;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("ls tablet service is not init", KR(ret), KPC(this));
} else if (OB_FAIL(mds_table_mgr_.flush(SCN::max_scn(), true))) {
LOG_WARN("flush mds table failed", KR(ret), KPC(this));
}
LOG_INFO("finish flush mds table", KR(ret), K(recycle_scn));
return ret;
}
int ObLSTabletService::set_frozen_for_all_memtables()
{
int ret = OB_SUCCESS;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else {
SetMemtableFrozenOperator set_mem_frozen_op(this);
if (OB_FAIL(tablet_id_set_.foreach(set_mem_frozen_op))) {
LOG_WARN("fail to set memtables frozen", K(ret), K(set_mem_frozen_op.cur_tablet_id_));
}
}
return ret;
}
int ObLSTabletService::ha_scan_all_tablets(const HandleTabletMetaFunc &handle_tablet_meta_f)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(!is_inited_)) {
ret = OB_NOT_INIT;
LOG_WARN("not inited", K(ret), K_(is_inited));
} else {
ObHALSTabletIterator iterator(ls_->get_ls_id(), false/* need_initial_state */);
if (OB_FAIL(build_tablet_iter(iterator))) {
LOG_WARN("fail to build tablet iterator", K(ret), KPC(this));
} else {
ObTabletHandle tablet_handle;
ObTablet *tablet = nullptr;
obrpc::ObCopyTabletInfo tablet_info;
ObTabletCreateDeleteMdsUserData user_data;
bool committed_flag = false;
while (OB_SUCC(ret)) {
tablet_info.reset();
user_data.reset();
committed_flag = false;
if (OB_FAIL(iterator.get_next_tablet(tablet_handle))) {
if (OB_ITER_END == ret) {
ret = OB_SUCCESS;
break;
} else {
LOG_WARN("failed to get tablet", K(ret));
}
} else if (OB_ISNULL(tablet = tablet_handle.get_obj())) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("tablet is nullptr", K(ret), K(tablet_handle));
} else if (OB_FAIL(tablet->ObITabletMdsInterface::get_latest_tablet_status(user_data, committed_flag))) {
if (OB_EMPTY_RESULT == ret) {
ret = OB_SUCCESS;
} else {
LOG_WARN("failed to get latest tablet status", K(ret), KPC(tablet));
}
} else if (!committed_flag && ObTabletStatus::TRANSFER_IN == user_data.tablet_status_) {
//TODO(muwei.ym) CAN NOT USE this condition when MDS supports uncommitted transaction
// why we should skip uncommited transfer in tablet, because if we backup the uncommited transfer in tablet
// but the final result of the uncommited transfer in tablet is aborted, which means the tablet has no MDS Table,
// and the restore process will create this tablet nontheless, however this aborted tablet should be GC-ed at the end,
// because the aborted tablet has no MDS Table, the tablet can not be GC-ed correctly, resulting in the tablet dangling
// for details, see issue-51990749
// we can skip backup uncommited transfer in tablets because we backup ls meta first
// if the start transfer in transaction is not commited, the clog_checkpoint_scn recorded
// in ls meta will not be advanced, so that even though we skip backup uncommited
// transfer in tablet, we can still restore transfer in tablet by replaying clog
LOG_WARN("tablet is transfer in but not commited, skip", K(tablet_handle), K(user_data));
continue;
} else if (OB_FAIL(tablet->build_migration_tablet_param(tablet_info.param_))) {
LOG_WARN("failed to build migration tablet param", K(ret));
} else if (OB_FAIL(tablet->get_ha_sstable_size(tablet_info.data_size_))) {
LOG_WARN("failed to get sstable size", K(ret), KPC(tablet));
} else if (OB_FAIL(ObStorageHAUtils::get_server_version(tablet_info.version_))) {
LOG_WARN("failed to get server version", K(ret), K(tablet_info));
} else {
tablet_info.tablet_id_ = tablet->get_tablet_meta().tablet_id_;
tablet_info.status_ = ObCopyTabletStatus::TABLET_EXIST;
if (OB_FAIL(handle_tablet_meta_f(tablet_info))) {
LOG_WARN("fail to handle tablet meta", K(ret), K(tablet_info));
}
}
}
}
}
return ret;
}
int ObLSTabletService::ha_get_tablet(
const common::ObTabletID &tablet_id,
ObTabletHandle &handle)
{
int ret = OB_SUCCESS;
bool is_empty_shell = false;
ObTablet *tablet = nullptr;
if (OB_FAIL(direct_get_tablet(tablet_id, handle))) {
LOG_WARN("failed to get tablet", K(ret), K(tablet_id));
} else if (OB_ISNULL(tablet = handle.get_obj())) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("tablet should not be NULL", K(ret), K(tablet_id));
} else if (tablet->is_empty_shell()) {
// treat empty shell as tablet not exist.
ret = OB_TABLET_NOT_EXIST;
}
return ret;
}
int ObLSTabletService::check_real_leader_for_4377_(const ObLSID ls_id)
{
int ret = OB_SUCCESS;
ObLSService* ls_srv = nullptr;
ObLSHandle ls_handle;
ObLS *ls = nullptr;
int64_t epoch = 0;
bool is_real_leader = false;
if (OB_ISNULL(ls_srv = MTL(ObLSService*))) {
ret = OB_ERR_UNEXPECTED;
LOG_ERROR("MTL(ObLSService*) fail, MTL not init?", K(ret));
} else if (OB_FAIL(ls_srv->get_ls(ls_id,
ls_handle,
ObLSGetMod::TRANS_MOD))) {
LOG_ERROR("ls_srv->get_ls() fail", KR(ret));
} else if (OB_ISNULL(ls = ls_handle.get_ls())) {
ret = OB_ERR_UNEXPECTED;
LOG_ERROR("invalid ls", KR(ret));
} else if (OB_FAIL(ls->get_tx_svr()->get_tx_ls_log_adapter()->get_role(is_real_leader, epoch))) {
LOG_WARN("get replica status fail", K(ret), KPC(ls));
} else if (!is_real_leader) {
ret = OB_NOT_MASTER;
LOG_WARN("get follower status during 4377", K(ret), KPC(ls));
}
return ret;
}
int ObLSTabletService::check_need_rollback_in_transfer_for_4377_(const transaction::ObTxDesc *tx_desc,
ObTabletHandle &data_tablet_handle)
{
int ret = OB_SUCCESS;
ObTabletCreateDeleteMdsUserData user_data;
bool unused_committed_flag = false;
if (OB_ISNULL(tx_desc)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("tx_desc is null when check 4377", K(ret));
} else if (OB_FAIL(data_tablet_handle.get_obj()->ObITabletMdsInterface::get_latest_tablet_status(
user_data, unused_committed_flag))) {
LOG_WARN("can not get the tablet status from ObITabletMdsInterface", K(ret));
} else {
// ObTabletStatus tablet_status = user_data.tablet_status_;
// CASE 1: tablet_status_ == NORMAL, means there's no transfer in progress right now.
// If there's valid transfer_scn_, which means transfer has finished, we should check
// whether the transaction started before transfer to avoid throwing incorrect 4377
// error. Otherwise, it's a normal case of 4377 check because no transfer has happened,
// and we should still throw 4377 error.
//
// CASE 2: tablet_status_ == TRANSFER_OUT, means it's in transfer out progress.
// CASE 2.1: transfer_scn_ is invalid, the transfer_scn_ is not backfilled, we still
// read from origin tablet, if there's inconsistent, it should throw 4377 error
// CASE 2.2: transfer_scn_ is valid, the transfer_scn_ is backfilled, it means that
// tablet has started to transfer out. If it's the first transfer, we should
// throw 4377 error, otherwise we should compare the transfer_scn_ with the tx_scn,
// and decide to rollback the transaction or throw 4377 error.
// However, we can not be sure about whether this transfer out is the first transfer or not.
// So we consider all the transfer out status as not the first transfer here, to avoid
// throwing the incorrect 4377 error.
//
// CASE 3: tablet_status_ == TRANSFER_IN, means it's in transfer in progress, and
// the transfer out progress must have been finished. We can compare the transfer_scn_
// with the tx_scn directly because there should be valid transfer_scn_.
//
// Above all, we do not need to consider the status of tablet.
if (user_data.transfer_scn_.is_valid()) {
if (user_data.transfer_scn_.convert_to_ts() > tx_desc->get_active_ts()) {
// TODO(yangyifei.yyf): active_ts is set by ObClockGenerator::get_clock, it's not a GTS.
// And transfer_scn is set by redo_scn, it's incorrect to compare it with active_ts.
// We should adjust this judgment later.
ret = OB_TRANS_NEED_ROLLBACK;
LOG_WARN("maybe meet transfer during kill tx, which can cause 4377 error, so we will rollback it",
K(tx_desc),
K(user_data));
}
} else {
// There's no transfer after trans begin, still throw 4377 error
}
}
return ret;
}
int ObLSTabletService::check_parts_tx_state_in_transfer_for_4377_(transaction::ObTxDesc *tx_desc)
{
int ret = OB_SUCCESS;
transaction::ObTransService *txs = MTL(transaction::ObTransService *);
transaction::ObTxPartList copy_parts;
bool is_alive = false;
if (OB_ISNULL(tx_desc)) {
ret = OB_ERR_UNEXPECTED;
LOG_ERROR("tx_desc is null", K(ret));
} else if (OB_FAIL(tx_desc->get_parts_copy(copy_parts))) {
TRANS_LOG(WARN, "get participants copy error", K(ret));
} else {
// Although we can verify whether transaction data is incomplete due to the
// transfer by checking the local tablet. While in the scenario where we
// validate the index table through the main table, we cannot discover
// whether the main table's txn data is incomplete due to the transfer by
// using the local index table. Furthermore, the local index table and the
// main table may not even locate on the same machine.
//
// Therefore, we choose to traverse all participant lists through RPC to
// confirm whether the txn context that could potentially participate in the
// transfer and has been terminated due to the transfer. In this scenario,
// we consider the occurrence of 4377 as misreporting, and we convert it
// into OB_TRANS_NEED_ROLLBACK to indicate the need to rollback the txn.
for (int64_t i = 0; OB_SUCC(ret) && i < copy_parts.count(); i++) {
ObLSID ls_id = copy_parts[i].id_;
is_alive = false;
if (OB_FAIL(txs->ask_tx_state_for_4377(ls_id,
tx_desc->get_tx_id(),
is_alive))) {
TRANS_LOG(WARN, "fail to ask tx state for 4377", K(tx_desc));
} else if (!is_alive) {
ret = OB_TRANS_NEED_ROLLBACK;
LOG_WARN("maybe meet transfer during kill tx, which can cause 4377 error, so we will rollback it",
K(tx_desc));
}
}
}
return ret;
}
int ObLSTabletService::offline_build_tablet_without_memtable_()
{
int ret = OB_SUCCESS;
ObArray<ObTabletID> tablet_id_array;
const bool except_ls_inner_tablet = false;
const SCN scn(SCN::max_scn());
if (OB_FAIL(get_all_tablet_ids(except_ls_inner_tablet, tablet_id_array))) {
LOG_WARN("failed to get all tablet ids", K(ret));
} else {
for (int64_t i = 0; OB_SUCC(ret) && i < tablet_id_array.count(); ++i) {
const ObTabletID &tablet_id = tablet_id_array.at(i);
if (OB_FAIL(update_tablet_release_memtable_for_offline(tablet_id, scn))) {
LOG_WARN("failed to update tablet release memtable", K(ret), K(tablet_id));
}
}
}
return ret;
}
int ObLSTabletService::offline_destroy_memtable_and_mds_table_()
{
int ret = OB_SUCCESS;
DestroyMemtableAndMemberAndMdsTableOperator clean_mem_op(this);
if (OB_FAIL(tablet_id_set_.foreach(clean_mem_op))) {
LOG_WARN("fail to clean memtables", K(ret), "cur_tablet_id", clean_mem_op.cur_tablet_id_);
}
return ret;
}
} // namespace storage
} // namespace oceanbase