/** * Copyright (c) 2021 OceanBase * OceanBase CE is licensed under Mulan PubL v2. * You can use this software according to the terms and conditions of the Mulan PubL v2. * You may obtain a copy of Mulan PubL v2 at: * http://license.coscl.org.cn/MulanPubL-2.0 * THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, * EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, * MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. * See the Mulan PubL v2 for more details. */ #define USING_LOG_PREFIX STORAGE #include "storage/ls/ob_ls_tablet_service.h" #include "common/row/ob_row_store.h" #include "lib/objectpool/ob_server_object_pool.h" #include "lib/utility/ob_macro_utils.h" #include "lib/utility/utility.h" #include "logservice/ob_log_base_header.h" #include "logservice/ob_log_base_type.h" #include "logservice/ob_log_service.h" #include "share/scn.h" #include "observer/report/ob_i_meta_report.h" #include "share/ob_disk_usage_table_operator.h" #include "share/rc/ob_tenant_base.h" #include "share/schema/ob_table_param.h" #include "share/schema/ob_table_dml_param.h" #include "share/schema/ob_tenant_schema_service.h" #include "share/ob_ddl_common.h" #include "storage/blocksstable/index_block/ob_index_block_builder.h" #include "storage/blocksstable/ob_sstable_meta.h" #include "storage/ob_dml_running_ctx.h" #include "storage/ob_partition_range_spliter.h" #include "storage/ob_query_iterator_factory.h" #include "storage/ob_relative_table.h" #include "storage/ob_row_reshape.h" #include "storage/ob_storage_struct.h" #include "storage/ob_storage_table_guard.h" #include "storage/ob_value_row_iterator.h" #include "storage/access/ob_table_scan_iterator.h" #include "storage/access/ob_table_scan_range.h" #include "storage/access/ob_rows_info.h" #include "storage/access/ob_table_scan_range.h" #include "storage/access/ob_rows_info.h" #include "storage/access/ob_table_estimator.h" #include "storage/access/ob_index_sstable_estimator.h" #include "storage/column_store/ob_column_oriented_sstable.h" #include "storage/blocksstable/ob_sstable.h" #include "storage/ls/ob_ls.h" #include "storage/tablet/ob_tablet.h" #include "storage/tablet/ob_tablet_iterator.h" #include "storage/tablet/ob_tablet_binding_helper.h" #include "storage/tablet/ob_tablet_create_delete_helper.h" #include "storage/tablet/ob_tablet_create_sstable_param.h" #include "storage/tablet/ob_tablet_persister.h" #include "storage/tablet/ob_tablet_service_clog_replay_executor.h" #include "storage/tablet/ob_tablet_status.h" #include "storage/tablet/ob_tablet_slog_helper.h" #include "storage/tablet/ob_tablet_persister.h" #include "storage/tx/ob_trans_define.h" #include "storage/tx/ob_trans_part_ctx.h" #include "storage/tx_storage/ob_ls_service.h" #include "storage/meta_mem/ob_tablet_map_key.h" #include "storage/meta_mem/ob_tenant_meta_mem_mgr.h" #include "storage/slog/ob_storage_log_replayer.h" #include "storage/slog/ob_storage_log_struct.h" #include "storage/slog/ob_storage_logger.h" #include "share/ob_lob_access_utils.h" #include "observer/table_load/ob_table_load_table_ctx.h" #include "observer/table_load/ob_table_load_coordinator.h" #include "observer/table_load/ob_table_load_service.h" #include "observer/table_load/ob_table_load_store.h" #include "observer/ob_server_event_history_table_operator.h" #include "storage/high_availability/ob_storage_ha_utils.h" using namespace oceanbase::share; using namespace oceanbase::common; using namespace oceanbase::transaction; using namespace oceanbase::blocksstable; using namespace oceanbase::observer; namespace oceanbase { namespace storage { using namespace mds; ObLSTabletService::ObLSTabletService() : ls_(nullptr), tx_data_memtable_mgr_(), tx_ctx_memtable_mgr_(), lock_memtable_mgr_(), mds_table_mgr_(), tablet_id_set_(), bucket_lock_(), allow_to_read_mgr_(), is_inited_(false), is_stopped_(false) { } ObLSTabletService::~ObLSTabletService() { } int ObLSTabletService::init( ObLS *ls) { int ret = OB_SUCCESS; if (OB_UNLIKELY(is_inited_)) { ret = OB_INIT_TWICE; LOG_WARN("init twice", K(ret), K_(is_inited)); } else if (OB_ISNULL(ls)) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(ls)); } else if (OB_FAIL(tablet_id_set_.init(ObTabletCommon::BUCKET_LOCK_BUCKET_CNT, MTL_ID()))) { LOG_WARN("fail to init tablet id set", K(ret)); } else if (OB_FAIL(bucket_lock_.init(ObTabletCommon::BUCKET_LOCK_BUCKET_CNT, ObLatchIds::TABLET_BUCKET_LOCK, "TabletSvrBucket", MTL_ID()))) { LOG_WARN("failed to init bucket lock", K(ret)); } else if (OB_FAIL(set_allow_to_read_(ls))) { LOG_WARN("failed to set allow to read", K(ret)); } else if (OB_FAIL(mds_table_mgr_.init(ls))) { LOG_WARN("fail to init mds table mgr", KR(ret)); } else { ls_ = ls; is_stopped_ = false; is_inited_ = true; } if (OB_UNLIKELY(!is_inited_)) { destroy(); } return ret; } void ObLSTabletService::destroy() { delete_all_tablets(); tablet_id_set_.destroy(); tx_data_memtable_mgr_.destroy(); tx_ctx_memtable_mgr_.destroy(); lock_memtable_mgr_.destroy(); mds_table_mgr_.destroy(); bucket_lock_.destroy(); ls_= nullptr; is_stopped_ = false; is_inited_ = false; } int ObLSTabletService::stop() { int ret = OB_SUCCESS; if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else { is_stopped_ = true; } return ret; } int ObLSTabletService::offline() { int ret = OB_SUCCESS; if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_FAIL(offline_build_tablet_without_memtable_())) { LOG_WARN("failed to offline build tablet without memtable", K(ret)); } else if (OB_FAIL(offline_destroy_memtable_and_mds_table_())) { LOG_WARN("failed to offline destroy memtable and mds table", K(ret)); } else { mds_table_mgr_.offline(); } return ret; } int ObLSTabletService::online() { return OB_SUCCESS; } int ObLSTabletService::replay( const void *buffer, const int64_t nbytes, const palf::LSN &lsn, const SCN &scn) { int ret = OB_SUCCESS; int64_t pos = 0; logservice::ObLogBaseHeader base_header; common::ObTabletID tablet_id; const char *log_buf = static_cast(buffer); ObTabletServiceClogReplayExecutor replayer_executor; if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_FAIL(base_header.deserialize(log_buf, nbytes, pos))) { LOG_WARN("log base header deserialize error", K(ret)); } else if (logservice::ObLogBaseType::STORAGE_SCHEMA_LOG_BASE_TYPE != base_header.get_log_type()) { ret = OB_NOT_SUPPORTED; LOG_WARN("log type not supported", K(ret), "log_type", base_header.get_log_type()); } else if (OB_FAIL(tablet_id.deserialize(log_buf, nbytes, pos))) { LOG_WARN("fail to deserialize tablet id", K(ret), KP(log_buf), K(nbytes), K(pos)); } else if (OB_FAIL(replayer_executor.init(log_buf, nbytes, pos, scn))) { LOG_WARN("failed to init replayer", K(ret), KP(log_buf), K(nbytes), K(pos), K(lsn), K(scn)); } else if (OB_FAIL(replayer_executor.execute(scn, ls_->get_ls_id(), tablet_id))) { if (OB_TABLET_NOT_EXIST == ret) { ret = OB_SUCCESS; // TODO (bowen.gbw): unify multi data replay logic LOG_INFO("tablet does not exist, skip", K(ret), K(replayer_executor)); } else if (OB_TIMEOUT == ret) { LOG_INFO("replace timeout errno", KR(ret), K(replayer_executor)); ret = OB_EAGAIN; } else { LOG_WARN("failed to replay", K(ret), K(replayer_executor)); } } return ret; } void ObLSTabletService::switch_to_follower_forcedly() { // TODO } int ObLSTabletService::switch_to_leader() { int ret = OB_SUCCESS; //TODO return ret; } int ObLSTabletService::switch_to_follower_gracefully() { int ret = OB_SUCCESS; //TODO return ret; } int ObLSTabletService::resume_leader() { int ret = OB_SUCCESS; //TODO return ret; } int ObLSTabletService::flush(SCN &recycle_scn) { UNUSED(recycle_scn); return OB_SUCCESS; } SCN ObLSTabletService::get_rec_scn() { return SCN::max_scn(); } int ObLSTabletService::prepare_for_safe_destroy() { int ret = OB_SUCCESS; if (OB_FAIL(delete_all_tablets())) { LOG_WARN("fail to delete all tablets", K(ret)); } #ifdef ERRSIM if (!ls_->get_ls_id().is_sys_ls()) { SERVER_EVENT_SYNC_ADD("ls_tablet_service", "after_delete_all_tablets", "tenant_id", MTL_ID(), "ls_id", ls_->get_ls_id().id()); DEBUG_SYNC(AFTER_LS_GC_DELETE_ALL_TABLETS); } #endif return ret; } int ObLSTabletService::safe_to_destroy(bool &is_safe) { int ret = OB_SUCCESS; ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); is_safe = true; if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else { int64_t tx_data_memtable_mgr_ref = tx_data_memtable_mgr_.get_ref(); int64_t tx_ctx_memtable_mgr_ref = tx_ctx_memtable_mgr_.get_ref(); int64_t lock_memtable_mgr_ref = lock_memtable_mgr_.get_ref(); int64_t mds_table_mgr_ref = mds_table_mgr_.get_ref(); if (0 != tx_data_memtable_mgr_ref || 0 != tx_ctx_memtable_mgr_ref || 0 != lock_memtable_mgr_ref || 0 != mds_table_mgr_ref) { if (REACH_TIME_INTERVAL(60L * 1000000)) { // 60s LOG_WARN("inner tablet memtable mgr can't destroy", K(tx_data_memtable_mgr_ref), K(tx_ctx_memtable_mgr_ref), K(lock_memtable_mgr_ref), K(mds_table_mgr_ref)); } is_safe = false; } else { tx_data_memtable_mgr_.destroy(); tx_ctx_memtable_mgr_.destroy(); lock_memtable_mgr_.destroy(); mds_table_mgr_.destroy(); } if (is_safe) { bool is_wait_gc = false; if (OB_FAIL(t3m->has_meta_wait_gc(is_wait_gc))) { LOG_WARN("failed to check has_meta_wait_gc", K(ret)); is_safe = false; } else { is_safe = !is_wait_gc; } } } return ret; } int ObLSTabletService::delete_all_tablets() { int ret = OB_SUCCESS; if (OB_NOT_NULL(ls_)) { const ObLSID &ls_id = ls_->get_ls_id(); ObSArray tablet_id_array; GetAllTabletIDOperator op(tablet_id_array); ObTimeGuard time_guard("ObLSTabletService::delete_all_tablets", 1_s); common::ObBucketWLockAllGuard lock_guard(bucket_lock_); time_guard.click("Lock"); if (OB_FAIL(tablet_id_set_.foreach(op))) { LOG_WARN("failed to traverse tablet id set", K(ret), K(ls_id)); } else if (tablet_id_array.empty()) { // tablet id array is empty, do nothing } else { for (int64_t i = 0; OB_SUCC(ret) && i < tablet_id_array.count(); ++i) { const ObTabletID &tablet_id = tablet_id_array.at(i); if (OB_FAIL(inner_remove_tablet(ls_id, tablet_id))) { LOG_ERROR("failed to do remove tablet", K(ret), K(ls_id), K(tablet_id)); ob_usleep(1000 * 1000); ob_abort(); } } time_guard.click("RemoveTablet"); if (OB_SUCC(ret)) { report_tablet_to_rs(tablet_id_array); time_guard.click("ReportToRS"); } } } return ret; } int ObLSTabletService::remove_tablet(const ObTabletHandle& tablet_handle) { int ret = OB_SUCCESS; if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!tablet_handle.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid tablet", K(ret), K(tablet_handle)); } else { const ObTablet &target_tablet = *(tablet_handle.get_obj()); const ObLSID ls_id = ls_->get_ls_id(); const ObTabletID tablet_id = target_tablet.get_tablet_meta().tablet_id_; const ObTabletMapKey key(ls_id, tablet_id); ObTabletHandle cur_tablet_handle; ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); if (OB_FAIL(ObTabletCreateDeleteHelper::get_tablet(key, cur_tablet_handle))) { if (OB_TABLET_NOT_EXIST == ret) { ret = OB_SUCCESS; LOG_INFO("tablet does not exist, maybe already deleted", K(ret), K(key)); } else { LOG_WARN("failed to get tablet", K(ret), K(key)); } } else if (&target_tablet != cur_tablet_handle.get_obj()) { ret = OB_EAGAIN; LOG_INFO("tablet object has been changed, need retry", K(ret), K(key), K(target_tablet), KPC(cur_tablet_handle.get_obj())); } else { if (OB_FAIL(ObTabletSlogHelper::write_remove_tablet_slog(ls_id, tablet_id))) { LOG_WARN("failed to write remove tablet slog", K(ret), K(ls_id), K(tablet_id)); } else if (OB_FAIL(tablet_handle.get_obj()->wait_release_memtables())) { LOG_ERROR("failed to release memtables", K(ret), K(tablet_id)); } else if (OB_FAIL(inner_remove_tablet(ls_id, tablet_id))) { LOG_ERROR("failed to do remove tablet", K(ret), K(ls_id), K(tablet_id)); ob_usleep(1000 * 1000); ob_abort(); } else { report_tablet_to_rs(tablet_id); } } } return ret; } int ObLSTabletService::remove_tablets(const common::ObIArray &tablet_id_array) { int ret = OB_SUCCESS; const int64_t tablet_cnt = tablet_id_array.count(); ObSArray all_tablet_id_hash_array; ObSArray tablet_ids; if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(0 == tablet_cnt)) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args, tablet id array is empty", K(ret), K(tablet_id_array)); } else if (OB_FAIL(all_tablet_id_hash_array.reserve(tablet_cnt))) { LOG_WARN("failed to reserve memory for array", K(ret), K(tablet_cnt)); } else if (OB_FAIL(tablet_ids.reserve(tablet_cnt))) { LOG_WARN("failed to reserve memory for array", K(ret), K(tablet_cnt)); } else { for (int64_t i = 0; OB_SUCC(ret) && i < tablet_cnt; ++i) { const ObTabletID &tablet_id = tablet_id_array.at(i); if (OB_FAIL(all_tablet_id_hash_array.push_back(tablet_id.hash()))) { LOG_WARN("failed to push back tablet id hash value", K(ret), K(tablet_id)); } } } if (OB_SUCC(ret)) { ObMetaDiskAddr tablet_addr; ObTimeGuard time_guard("ObLSTabletService::remove_tablets", 1_s); ObMultiBucketLockGuard lock_guard(bucket_lock_, true/*is_write_lock*/); if (OB_FAIL(lock_guard.lock_multi_buckets(all_tablet_id_hash_array))) { LOG_WARN("failed to lock multi buckets", K(ret)); } else { time_guard.click("Lock"); const share::ObLSID &ls_id = ls_->get_ls_id(); ObTabletHandle tablet_handle; ObTabletMapKey key; key.ls_id_ = ls_id; // check tablet existence for (int64_t i = 0; OB_SUCC(ret) && i < tablet_cnt; ++i) { const ObTabletID &tablet_id = tablet_id_array.at(i); key.tablet_id_ = tablet_id; tablet_addr.reset(); if (OB_FAIL(ObTabletCreateDeleteHelper::get_tablet(key, tablet_handle))) { if (OB_TABLET_NOT_EXIST == ret) { ret = OB_SUCCESS; LOG_INFO("tablet does not exist, maybe already deleted", K(ret), K(key)); } else { LOG_WARN("failed to get tablet", K(ret), K(key)); } } else if (OB_FAIL(tablet_handle.get_obj()->wait_release_memtables())) { LOG_ERROR("failed to release memtables", K(ret), K(tablet_id)); } else if (OB_FAIL(tablet_handle.get_obj()->get_meta_disk_addr(tablet_addr))) { LOG_WARN("failed to get tablet addr", K(ret), K(key)); } else if (!tablet_addr.is_disked()) { if (OB_FAIL(inner_remove_tablet(ls_id, tablet_id))) { LOG_WARN("failed to remove non disked tablet from memory", K(ret), K(key)); } else { FLOG_INFO("succeeded to remove non disked tablet from memory", K(ret), K(key)); } } else if (OB_FAIL(tablet_ids.push_back(tablet_id))) { LOG_WARN("failed to push back tablet id", K(ret), K(tablet_id)); } } // write slog and do remove tablet if (OB_FAIL(ret)) { } else if (tablet_ids.empty()) { LOG_INFO("all tablets already deleted, do nothing", K(ret), K(ls_id), K(tablet_id_array)); } else if (OB_FAIL(ObTabletSlogHelper::write_remove_tablet_slog(ls_id, tablet_ids))) { LOG_WARN("failed to write remove tablet slog", K(ret), K(ls_id), K(tablet_ids)); } else { time_guard.click("WrSlog"); for (int64_t i = 0; OB_SUCC(ret) && i < tablet_ids.count(); ++i) { const ObTabletID &tablet_id = tablet_ids.at(i); if (OB_FAIL(inner_remove_tablet(ls_id, tablet_id))) { LOG_ERROR("failed to do remove tablet", K(ret), K(ls_id), K(tablet_id)); ob_usleep(1000 * 1000); ob_abort(); } } if (OB_SUCC(ret)) { report_tablet_to_rs(tablet_ids); time_guard.click("ReportToRS"); } } } } return ret; } int ObLSTabletService::do_remove_tablet(const ObTabletMapKey &key) { int ret = OB_SUCCESS; ObTimeGuard time_guard("RmTabletLock", 1_s); ObBucketHashWLockGuard lock_guard(bucket_lock_, key.tablet_id_.hash()); time_guard.click("Lock"); if (OB_FAIL(inner_remove_tablet(key.ls_id_, key.tablet_id_))) { LOG_WARN("fail to remove tablet with lock", K(ret), K(key)); } return ret; } // TODO(yunshan.tys) cope with failure of deleting tablet (tablet hasn't been loaded from disk) int ObLSTabletService::inner_remove_tablet( const share::ObLSID &ls_id, const ObTabletID &tablet_id) { int ret = OB_SUCCESS; const ObTabletMapKey key(ls_id, tablet_id); ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); if (OB_FAIL(tablet_id_set_.erase(tablet_id))) { if (OB_HASH_NOT_EXIST == ret) { // tablet id is already erased ret = OB_SUCCESS; } else { LOG_WARN("fail to erase tablet id from set", K(ret), K(ls_id), K(tablet_id)); } } if (OB_SUCC(ret)) { // loop retry to delete tablet from t3m while (OB_FAIL(t3m->del_tablet(key))) { if (REACH_TIME_INTERVAL(10 * 1000 * 1000)) { LOG_ERROR("failed to delete tablet from t3m", K(ret), K(ls_id), K(tablet_id)); } } } if (OB_SUCC(ret)) { FLOG_INFO("succeeded to remove tablet", K(ret), K(ls_id), K(tablet_id)); } return ret; } int ObLSTabletService::get_tablet( const ObTabletID &tablet_id, ObTabletHandle &handle, const int64_t timeout_us, const ObMDSGetTabletMode mode) { int ret = OB_SUCCESS; const ObTabletMapKey key(ls_->get_ls_id(), tablet_id); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!tablet_id.is_valid() || mode < ObMDSGetTabletMode::READ_ALL_COMMITED)) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(tablet_id), K(mode)); } else if (OB_FAIL(ObTabletCreateDeleteHelper::check_and_get_tablet(key, handle, timeout_us, mode, ObTransVersion::MAX_TRANS_VERSION))) { if (OB_TABLET_NOT_EXIST == ret) { LOG_DEBUG("failed to check and get tablet", K(ret), K(key), K(timeout_us), K(mode)); } else { LOG_WARN("failed to check and get tablet", K(ret), K(key), K(timeout_us), K(mode)); } } return ret; } int ObLSTabletService::get_tablet_addr(const ObTabletMapKey &key, ObMetaDiskAddr &addr) { int ret = OB_SUCCESS; ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else { // 加读锁保证ckpt与对tablet的操作串行, 防止ckpt时tablet操作处在 // slog已经写入而tablet addr未更新的状态,导致slog丢失 ObBucketHashRLockGuard lock_guard(bucket_lock_, key.tablet_id_.hash()); if (OB_FAIL(t3m->get_tablet_addr(key, addr))) { LOG_WARN("fail to get tablet addr", K(ret), K(key)); } } return ret; } void ObLSTabletService::report_tablet_to_rs(const common::ObTabletID &tablet_id) { int ret = OB_SUCCESS; const share::ObLSID &ls_id = ls_->get_ls_id(); if (tablet_id.is_ls_inner_tablet()) { // no need to report for ls inner tablet } else if (OB_FAIL(MTL(ObTabletTableUpdater*)->submit_tablet_update_task(ls_id, tablet_id))) { LOG_WARN("failed to report tablet info", KR(ret), K(ls_id), K(tablet_id)); } } void ObLSTabletService::report_tablet_to_rs( const common::ObIArray &tablet_id_array) { int ret = OB_SUCCESS; const uint64_t tenant_id = MTL_ID(); const share::ObLSID &ls_id = ls_->get_ls_id(); // ignore ret on purpose for (int64_t i = 0; i < tablet_id_array.count(); ++i) { const common::ObTabletID &tablet_id = tablet_id_array.at(i); if (tablet_id.is_ls_inner_tablet()) { // no need to report for ls inner tablet continue; } else if (OB_FAIL(MTL(ObTabletTableUpdater*)->submit_tablet_update_task(ls_id, tablet_id))) { LOG_WARN("failed to report tablet info", KR(ret), K(tenant_id), K(ls_id), K(tablet_id)); } } } int ObLSTabletService::table_scan(ObTabletHandle &tablet_handle, ObTableScanIterator &iter, ObTableScanParam ¶m) { int ret = OB_SUCCESS; NG_TRACE(S_table_scan_begin); AllowToReadMgr::AllowToReadInfo read_info; if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (FALSE_IT(allow_to_read_mgr_.load_allow_to_read_info(read_info))) { } else if (!read_info.allow_to_read()) { ret = OB_REPLICA_NOT_READABLE; LOG_WARN("ls is not allow to read", K(ret), KPC(ls_)); } else if (OB_FAIL(prepare_scan_table_param(param, *(MTL(ObTenantSchemaService*)->get_schema_service())))) { LOG_WARN("failed to prepare scan table param", K(ret), K(param)); } else if (OB_FAIL(inner_table_scan(tablet_handle, iter, param))) { LOG_WARN("failed to do table scan", K(ret), KP(&iter), K(param)); } else { bool is_same = false; allow_to_read_mgr_.check_read_info_same(read_info, is_same); if (!is_same) { ret = OB_REPLICA_NOT_READABLE; LOG_WARN("ls is not allow to read", K(ret), KPC(ls_), KP(&iter)); } } NG_TRACE(S_table_scan_end); return ret; } int ObLSTabletService::table_rescan(ObTabletHandle &tablet_handle, ObTableScanParam ¶m, ObNewRowIterator *result) { int ret = OB_SUCCESS; NG_TRACE(S_table_rescan_begin); AllowToReadMgr::AllowToReadInfo read_info; if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K(result), K_(is_inited)); } else if (OB_ISNULL(result)) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid argument", K(ret)); } else if (FALSE_IT(allow_to_read_mgr_.load_allow_to_read_info(read_info))) { } else if (!read_info.allow_to_read()) { ret = OB_REPLICA_NOT_READABLE; LOG_WARN("ls is not allow to read", K(ret), KPC(ls_)); } else if (OB_FAIL(prepare_scan_table_param(param, *(MTL(ObTenantSchemaService*)->get_schema_service())))) { LOG_WARN("failed to prepare scan table param", K(ret), K(result), K(param)); } else { ObTableScanIterator *iter = static_cast(result); if (OB_FAIL(inner_table_scan(tablet_handle, *iter, param))) { LOG_WARN("failed to do table scan", K(ret), K(result), K(param)); } } if (OB_SUCC(ret)) { bool is_same = false; allow_to_read_mgr_.check_read_info_same(read_info, is_same); if (!is_same) { ret = OB_REPLICA_NOT_READABLE; LOG_WARN("ls is not allow to read", K(ret), KPC(ls_)); } } NG_TRACE(S_table_rescan_end); return ret; } int ObLSTabletService::refresh_tablet_addr( const share::ObLSID &ls_id, const common::ObTabletID &tablet_id, ObTabletHandle &tablet_handle) { int ret = OB_SUCCESS; const ObTabletMapKey key(ls_id, tablet_id); ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); while (OB_SUCC(ret)) { ret = tablet_id_set_.set(tablet_id); if (OB_SUCC(ret)) { break; } else if (OB_ALLOCATE_MEMORY_FAILED == ret) { usleep(100 * 1000); if (REACH_COUNT_INTERVAL(100)) { LOG_ERROR("no memory for tablet id set, retry", K(ret), K(tablet_id)); } ret = OB_SUCCESS; } else { LOG_WARN("fail to set tablet id set", K(ret), K(tablet_id)); } } if (OB_FAIL(ret)) { } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, tablet_handle, tablet_handle))) { LOG_WARN("failed to add tablet to meta mem mgr", K(ret), K(key), K(tablet_handle)); } return ret; } int ObLSTabletService::trim_old_tablets(const ObTabletID &tablet_id) { int ret = OB_SUCCESS; ObTabletHandle tablet_handle_head; ObTimeGuard time_guard("ObLSTabletService::trim_old_tablets", 1_s); ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); time_guard.click("Lock"); if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle_head))) { LOG_WARN("failed to check and get tablet", K(ret), K(tablet_id)); } else if (tablet_handle_head.get_obj()->is_empty_shell()) { LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", tablet_handle_head.get_obj()); } else if (OB_UNLIKELY(!tablet_handle_head.get_obj()->get_tablet_meta().has_next_tablet_)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("doesn't have old tablet", K(ret), "tablet_meta", tablet_handle_head.get_obj()->get_tablet_meta()); } else { time_guard.click("GetTablet"); ObTablet *tablet_head = tablet_handle_head.get_obj(); ObTabletHandle new_tablet_handle; ObLSID ls_id = tablet_head->get_tablet_meta().ls_id_; tablet_head->trim_tablet_list(); ObMetaDiskAddr disk_addr; const ObTabletMapKey key(ls_->get_ls_id(), tablet_id); if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tablet_head, new_tablet_handle))) { LOG_WARN("fail to persist and transfor tablet", K(ret), KPC(tablet_head), K(new_tablet_handle)); } else if (FALSE_IT(time_guard.click("Persist"))) { } else if (FALSE_IT(disk_addr = new_tablet_handle.get_obj()->get_tablet_addr())) { } else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) { LOG_WARN("failed to write update tablet slog", K(ret), K(ls_id), K(tablet_id), K(disk_addr)); } else if (FALSE_IT(time_guard.click("WrSlog"))) { } else if (OB_FAIL(MTL(ObTenantMetaMemMgr*)->compare_and_swap_tablet( key, tablet_handle_head, new_tablet_handle))) { LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(tablet_handle_head), K(new_tablet_handle)); ob_usleep(1000 * 1000); ob_abort(); } else { time_guard.click("CASwap"); FLOG_INFO("succeeded to trim tablets list", K(key), K(disk_addr)); } } return ret; } int ObLSTabletService::rollback_rebuild_tablet(const ObTabletID &tablet_id) { int ret = OB_SUCCESS; ObTabletHandle tablet_handle_head; ObTimeGuard time_guard("ObLSTabletService::rollback_rebuild_tablet", 1_s); ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); time_guard.click("Lock"); if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle_head))) { LOG_WARN("failed to check and get tablet", K(ret), K(tablet_id)); } else if (tablet_handle_head.get_obj()->is_empty_shell()) { LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", tablet_handle_head.get_obj()); } else { time_guard.click("GetTablet"); ObTablet *tablet_head = tablet_handle_head.get_obj(); ObTabletHandle next_tablet_handle; ObMetaObj meta_obj; tablet_head->get_next_tablet_guard().get_obj(meta_obj); next_tablet_handle.set_obj(meta_obj); next_tablet_handle.set_wash_priority(WashTabletPriority::WTP_LOW); const ObTabletMapKey key(ls_->get_ls_id(), tablet_id); ObMetaDiskAddr disk_addr; ObTabletHandle new_tablet_handle; if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet( *next_tablet_handle.get_obj(), new_tablet_handle))) { LOG_WARN("fail to persist and transform tablet", K(ret), K(next_tablet_handle), K(new_tablet_handle)); } else if (FALSE_IT(time_guard.click("Persist"))) { } else if (FALSE_IT(disk_addr = new_tablet_handle.get_obj()->get_tablet_addr())) { } else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog( key.ls_id_, tablet_id, disk_addr))) { LOG_WARN("failed to write update tablet slog", K(ret), K(key), K(disk_addr)); } else if (FALSE_IT(time_guard.click("WrSlog"))) { } else if (OB_FAIL(MTL(ObTenantMetaMemMgr*)->compare_and_swap_tablet( key, tablet_handle_head, new_tablet_handle))) { LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(tablet_handle_head), K(new_tablet_handle)); ob_usleep(1000 * 1000); ob_abort(); } else { time_guard.click("CASwap"); FLOG_INFO("succeeded to rollback rebuild", K(key), K(disk_addr)); } } return ret; } int ObLSTabletService::rebuild_tablet_with_old( const ObMigrationTabletParam &mig_tablet_param, ObTabletHandle &tablet_guard) { int ret = OB_SUCCESS; ObTimeGuard time_guard("ObLSTabletService::rebuild_tablet_with_old", 1_s); common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "RebuildTablet")); ObTabletHandle old_tablet_hdl; ObTabletHandle tmp_tablet_hdl; ObTabletHandle new_tablet_hdl; ObTablet *tmp_tablet = nullptr; ObFreezer *freezer = ls_->get_freezer(); ObMetaDiskAddr disk_addr; ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); const common::ObTabletID &tablet_id = mig_tablet_param.tablet_id_; const share::ObLSID &ls_id = mig_tablet_param.ls_id_; const ObTabletMapKey key(ls_id, tablet_id); if (OB_FAIL(direct_get_tablet(tablet_id, old_tablet_hdl))) { LOG_WARN("failed to get tablet", K(ret), K(key)); } else if (FALSE_IT(time_guard.click("GetTablet"))) { } else if (old_tablet_hdl.get_obj()->is_empty_shell()) { LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", old_tablet_hdl.get_obj()); } else if (OB_FAIL(ObTabletCreateDeleteHelper::acquire_tmp_tablet(key, allocator, tmp_tablet_hdl))) { LOG_WARN("fail to acquire temporary tablet", K(ret), K(key)); } else if (FALSE_IT(tmp_tablet = tmp_tablet_hdl.get_obj())) { } else if (OB_FAIL(tmp_tablet->init_with_migrate_param(allocator, mig_tablet_param, true/*is_update*/, freezer))) { LOG_WARN("failed to init tablet", K(ret), K(mig_tablet_param)); } else if (FALSE_IT(time_guard.click("InitTablet"))) { } else if (FALSE_IT(tmp_tablet->set_next_tablet_guard(tablet_guard))) { } else if (FALSE_IT(time_guard.click("InitTablet"))) { } else if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tmp_tablet, new_tablet_hdl))) { LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tmp_tablet), K(new_tablet_hdl)); } else if (FALSE_IT(time_guard.click("Persist"))) { } else if (FALSE_IT(disk_addr = new_tablet_hdl.get_obj()->tablet_addr_)) { } else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) { LOG_WARN("fail to write update tablet slog", K(ret), K(ls_id), K(tablet_id), K(disk_addr)); } else if (FALSE_IT(time_guard.click("WrSlog"))) { } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_hdl, new_tablet_hdl))) { LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(old_tablet_hdl), K(new_tablet_hdl)); ob_usleep(1000 * 1000); ob_abort(); } else if (OB_FAIL(new_tablet_hdl.get_obj()->start_ddl_if_need())) { LOG_WARN("start ddl if need failed", K(ret), K(key)); } else { time_guard.click("CASwap"); LOG_INFO("rebuild tablet with old succeed", K(ret), K(key), K(disk_addr)); } return ret; } int ObLSTabletService::migrate_update_tablet( const ObMigrationTabletParam &mig_tablet_param) { int ret = OB_SUCCESS; ObTimeGuard time_guard("ObLSTabletService::migrate_update_tablet", 1_s); common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "MigUpTab")); const common::ObTabletID &tablet_id = mig_tablet_param.tablet_id_; const share::ObLSID &ls_id = mig_tablet_param.ls_id_; const ObTabletMapKey key(mig_tablet_param.ls_id_, mig_tablet_param.tablet_id_); ObTabletHandle old_tablet_hdl; ObTabletHandle tmp_tablet_hdl; ObTabletHandle new_tablet_hdl; ObTablet *new_tablet = nullptr; ObMetaDiskAddr disk_addr; ObFreezer *freezer = ls_->get_freezer(); ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); if (OB_FAIL(direct_get_tablet(tablet_id, old_tablet_hdl))) { LOG_WARN("failed to get tablet", K(ret), K(key)); } else if (FALSE_IT(time_guard.click("GetTablet"))) { } else if (OB_FAIL(ObTabletCreateDeleteHelper::acquire_tmp_tablet(key, allocator, tmp_tablet_hdl))) { LOG_WARN("fail to acquire temporary tablet", K(ret), K(key)); } else if (FALSE_IT(new_tablet = tmp_tablet_hdl.get_obj())) { } else if (OB_FAIL(new_tablet->init_with_migrate_param(allocator, mig_tablet_param, true/*is_update*/, freezer))) { LOG_WARN("failed to init tablet", K(ret), K(mig_tablet_param)); } else if (FALSE_IT(time_guard.click("InitTablet"))) { } else if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*new_tablet, new_tablet_hdl))) { LOG_WARN("fail to persist and transform tablet", K(ret), KPC(new_tablet), K(new_tablet_hdl)); } else if (FALSE_IT(time_guard.click("Persist"))) { } else if (FALSE_IT(disk_addr = new_tablet_hdl.get_obj()->tablet_addr_)) { } else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) { LOG_WARN("fail to write update tablet slog", K(ret), K(ls_id), K(tablet_id), K(disk_addr)); } else if (FALSE_IT(time_guard.click("WrSlog"))) { } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_hdl, new_tablet_hdl))) { LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(old_tablet_hdl), K(new_tablet_hdl)); ob_usleep(1000 * 1000); ob_abort(); } else if (OB_FAIL(new_tablet_hdl.get_obj()->start_ddl_if_need())) { LOG_WARN("start ddl if need failed", K(ret)); } else { time_guard.click("CASwap"); LOG_INFO("migrate update tablet succeed", K(ret), K(key), K(disk_addr)); } return ret; } int ObLSTabletService::migrate_create_tablet( const ObMigrationTabletParam &mig_tablet_param, ObTabletHandle &handle) { int ret = OB_SUCCESS; ObTimeGuard time_guard("ObLSTabletService::migrate_create_tablet", 1_s); common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "MigCreateTab")); const share::ObLSID &ls_id = mig_tablet_param.ls_id_; const common::ObTabletID &tablet_id = mig_tablet_param.tablet_id_; const ObTabletMapKey key(ls_id, tablet_id); ObFreezer *freezer = ls_->get_freezer(); ObTabletHandle tmp_tablet_hdl; ObTabletHandle tablet_handle; ObMetaDiskAddr disk_addr; if (OB_FAIL(ObTabletCreateDeleteHelper::create_tmp_tablet(key, allocator, tmp_tablet_hdl))) { LOG_WARN("fail to create temporary tablet", K(ret), K(key)); } else if (OB_FAIL(tmp_tablet_hdl.get_obj()->init_with_migrate_param(allocator, mig_tablet_param, false/*is_update*/, freezer))) { LOG_WARN("fail to init tablet", K(ret), K(mig_tablet_param)); } else if (FALSE_IT(time_guard.click("InitTablet"))) { } else if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tmp_tablet_hdl.get_obj(), tablet_handle))) { LOG_WARN("fail to persist and transform tablet", K(ret), K(tmp_tablet_hdl), K(tablet_handle)); } else if (FALSE_IT(time_guard.click("Persist"))) { } else if (FALSE_IT(disk_addr = tablet_handle.get_obj()->tablet_addr_)) { } else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) { LOG_WARN("fail to write update tablet slog", K(ret), K(ls_id), K(tablet_id), K(disk_addr)); } else if (FALSE_IT(time_guard.click("WrSlog"))) { } else if (OB_FAIL(refresh_tablet_addr(ls_id, tablet_id, tablet_handle))) { LOG_WARN("failed to refresh tablet addr", K(ret), K(ls_id), K(tablet_id), K(lbt())); ob_usleep(1000 * 1000); ob_abort(); } else if (FALSE_IT(time_guard.click("RefreshAddr"))) { } else if (OB_FAIL(tablet_handle.get_obj()->start_ddl_if_need())) { LOG_WARN("start ddl if need failed", K(ret)); } else { LOG_INFO("migrate create tablet succeed", K(ret), K(key), K(disk_addr)); } if (OB_SUCC(ret)) { handle = tablet_handle; } else { int tmp_ret = OB_SUCCESS; ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); if (OB_TMP_FAIL(tablet_id_set_.erase(tablet_id))) { if (OB_HASH_NOT_EXIST != tmp_ret) { LOG_ERROR("fail to erase tablet id from set", K(tmp_ret), K(tablet_id)); } } if (OB_TMP_FAIL(inner_remove_tablet(key.ls_id_, key.tablet_id_))) { LOG_WARN("fail to erase tablet from meta memory manager", K(tmp_ret), K(key)); } } return ret; } int ObLSTabletService::refresh_memtable_for_ckpt( const ObMetaDiskAddr &old_addr, const ObMetaDiskAddr &cur_addr, ObTabletHandle &new_tablet_handle) { int ret = OB_SUCCESS; if (OB_UNLIKELY(!old_addr.is_equal_for_persistence(cur_addr))) { ret = OB_NOT_THE_OBJECT; LOG_WARN("the old tablet has been replaced", K(ret), K(old_addr), K(cur_addr)); } else if (OB_UNLIKELY(old_addr != cur_addr)) { // memtables were updated if (OB_FAIL(new_tablet_handle.get_obj()->refresh_memtable_and_update_seq(cur_addr.seq()))) { LOG_WARN("fail to pull newest memtables", K(ret), K(old_addr), K(cur_addr), K(new_tablet_handle)); } } return ret; } int ObLSTabletService::update_tablet_checkpoint( const ObTabletMapKey &key, const ObMetaDiskAddr &old_addr, const ObMetaDiskAddr &new_addr, const bool is_replay_old, ObTabletHandle &new_handle) { int ret = OB_SUCCESS; ObTimeGuard time_guard("UpdateTabletCKPT", 3_s); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("ls tablet svr hasn't been inited", K(ret)); } else if (OB_UNLIKELY(!key.is_valid() || !old_addr.is_valid() || !new_addr.is_valid() || !new_addr.is_block() || (!is_replay_old && !new_handle.is_valid()))) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid argument", K(ret), K(key), K(new_addr), K(new_handle)); } else { common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "CKPTUpdate")); ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); ObTabletHandle tablet_handle; ObMetaDiskAddr addr; ObBucketHashWLockGuard lock_guard(bucket_lock_, key.tablet_id_.hash()); time_guard.click("Lock"); if (OB_FAIL(t3m->get_tablet_addr(key, addr))) { if (OB_ENTRY_NOT_EXIST == ret) { ret = OB_TABLET_NOT_EXIST; } LOG_WARN("fail to get old tablet addr", K(ret), K(key)); } else if (!is_replay_old) { if (OB_FAIL(t3m->get_tablet(WashTabletPriority::WTP_LOW, key, tablet_handle))) { LOG_WARN("fail to get tablet", K(ret), K(key)); } else if (FALSE_IT(time_guard.click("GetOld"))) { } else if (OB_FAIL(refresh_memtable_for_ckpt(old_addr, addr, new_handle))) { LOG_WARN("fail to update tablet", K(ret), K(old_addr), K(addr), K(new_handle)); } else if (FALSE_IT(time_guard.click("UpdateTablet"))) { } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, tablet_handle, new_handle))) { LOG_WARN("fail to compare and swap tablet", K(ret), K(tablet_handle), K(new_handle)); } } else { time_guard.click("GetOld"); if (OB_UNLIKELY(addr != old_addr)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("the old tablet has been replaced, which is not allowed during upgrade", K(ret), K(addr), K(old_addr)); } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_addr, new_addr))) { LOG_WARN("fail to compare and swap tablet", K(ret), K(old_addr), K(new_addr)); } } if (OB_SUCC(ret)) { time_guard.click("CASwap"); FLOG_INFO("succeeded to update tablet ckpt", K(key), K(old_addr), K(new_addr), K(is_replay_old)); } } return ret; } int ObLSTabletService::update_tablet_table_store( const ObTabletHandle &old_tablet_handle, const ObIArray &tables) { int ret = OB_SUCCESS; common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "UpTabStore")); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("ls tablet svr hasn't been inited", K(ret)); } else if (OB_UNLIKELY(!old_tablet_handle.is_valid() || 0 == tables.count())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("old tablet handle is invalid", K(ret), K(old_tablet_handle), K(tables.count())); } else { ObTablet *old_tablet = old_tablet_handle.get_obj(); const common::ObTabletID &tablet_id = old_tablet->get_tablet_meta().tablet_id_; ObTimeGuard time_guard("ObLSTabletService::ReplaceSSTable", 1_s); ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); time_guard.click("Lock"); ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); ObTabletHandle tablet_handle; if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle))) { if (OB_TABLET_NOT_EXIST == ret) { ret = OB_EAGAIN; LOG_WARN("this tablet has been deleted, skip it", K(ret), K(tablet_id)); } else { LOG_WARN("fail to get tablet", K(ret)); } } else if (tablet_handle.get_obj() != old_tablet) { ret = OB_EAGAIN; LOG_WARN("tablet has changed, skip it", K(ret), K(tablet_handle), K(old_tablet_handle)); } else if (old_tablet->is_empty_shell()) { LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", old_tablet); } else { time_guard.click("GetTablet"); ObTabletHandle tmp_tablet_hdl; ObTabletHandle new_tablet_hdl; ObTablet *tmp_tablet = nullptr; const share::ObLSID &ls_id = ls_->get_ls_id(); const ObTabletMapKey key(ls_id, tablet_id); ObMetaDiskAddr disk_addr; if (OB_FAIL(ObTabletCreateDeleteHelper::acquire_tmp_tablet(key, allocator, tmp_tablet_hdl))) { LOG_WARN("fail to acquire temporary tablet", K(ret), K(key)); } else if (FALSE_IT(tmp_tablet = tmp_tablet_hdl.get_obj())) { } else if (OB_FAIL(tmp_tablet->init_for_defragment(allocator, tables, *old_tablet))) { LOG_WARN("fail to init new tablet", K(ret), KPC(old_tablet)); } else if (FALSE_IT(time_guard.click("InitTablet"))) { } else if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tmp_tablet, new_tablet_hdl))) { LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tmp_tablet), K(new_tablet_hdl)); } else if (FALSE_IT(disk_addr = new_tablet_hdl.get_obj()->tablet_addr_)) { } else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) { LOG_WARN("fail to write update tablet slog", K(ret), K(ls_id), K(tablet_id), K(disk_addr)); } else if (FALSE_IT(time_guard.click("WrSlog"))) { } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_handle, new_tablet_hdl))) { LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(old_tablet_handle), K(new_tablet_hdl)); ob_usleep(1000 * 1000); ob_abort(); } else { time_guard.click("CASwap"); LOG_INFO("succeeded to build new tablet", K(ret), K(disk_addr), K(new_tablet_hdl), KPC(new_tablet_hdl.get_obj())); } } } return ret; } int ObLSTabletService::update_tablet_table_store( const common::ObTabletID &tablet_id, const ObUpdateTableStoreParam ¶m, ObTabletHandle &handle) { int ret = OB_SUCCESS; common::ObArenaAllocator allocator("UpdateTmpTablet", OB_MALLOC_NORMAL_BLOCK_SIZE, MTL_ID(), ObCtxIds::DEFAULT_CTX_ID); if (share::is_reserve_mode()) { // TODO(@DanLing) use LocalArena later allocator.set_ctx_id(ObCtxIds::MERGE_RESERVE_CTX_ID); } const share::ObLSID &ls_id = ls_->get_ls_id(); const ObTabletMapKey key(ls_id, tablet_id); ObTabletHandle old_tablet_hdl; ObTabletHandle tmp_tablet_hdl; ObTabletHandle new_tablet_hdl; ObTimeGuard time_guard("ObLSTabletService::UpdateTableStore", 1_s); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!tablet_id.is_valid() || !param.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(tablet_id), K(param)); } else if (OB_FAIL(ObTabletCreateDeleteHelper::acquire_tmp_tablet(key, allocator, tmp_tablet_hdl))) { if (OB_ENTRY_NOT_EXIST == ret) { ret = OB_TABLET_NOT_EXIST; } else { LOG_WARN("fail to acquire temporary tablet", K(ret), K(key)); } } else { ObTablet *tmp_tablet = tmp_tablet_hdl.get_obj(); time_guard.click("Acquire"); ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); time_guard.click("Lock"); if (OB_FAIL(direct_get_tablet(tablet_id, old_tablet_hdl))) { LOG_WARN("failed to get tablet", K(ret), K(tablet_id)); } else if (old_tablet_hdl.get_obj()->is_empty_shell()) { handle = old_tablet_hdl; LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", old_tablet_hdl.get_obj()); } else { time_guard.click("GetTablet"); ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); ObTablet *old_tablet = old_tablet_hdl.get_obj(); ObMetaDiskAddr disk_addr; if (OB_FAIL(tmp_tablet->init_for_merge(allocator, param, *old_tablet))) { LOG_WARN("failed to init tablet", K(ret), K(param), KPC(old_tablet)); } else if (FALSE_IT(time_guard.click("InitNew"))) { } else if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tmp_tablet, new_tablet_hdl))) { LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tmp_tablet), K(new_tablet_hdl)); } else if (FALSE_IT(disk_addr = new_tablet_hdl.get_obj()->tablet_addr_)) { } else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) { LOG_WARN("fail to write update tablet slog", K(ret), K(ls_id), K(tablet_id), K(disk_addr)); } else if (FALSE_IT(time_guard.click("WrSlog"))) { } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_hdl, new_tablet_hdl))) { LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(old_tablet_hdl), K(new_tablet_hdl)); ob_usleep(1000 * 1000); ob_abort(); } else if (FALSE_IT(time_guard.click("CASwap"))) { } else { handle = new_tablet_hdl; LOG_INFO("succeeded to build new tablet", K(ret), K(key), K(disk_addr), K(param), K(handle)); } } } return ret; } int ObLSTabletService::update_tablet_mstx( const ObTabletMapKey &key, const ObMetaDiskAddr &old_addr, const ObTabletHandle &old_tablet_handle, ObTabletHandle &new_tablet_handle) { int ret = OB_SUCCESS; ObTablet *new_tablet = nullptr; ObMetaDiskAddr new_addr; ObTimeGuard time_guard("ObLSTabletService::update_tablet_mstx", 1_s); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!key.is_valid() || !old_addr.is_valid() || !old_tablet_handle.is_valid() || !new_tablet_handle.is_valid() || !(new_tablet = new_tablet_handle.get_obj())->is_valid() || !(new_addr = new_tablet->get_tablet_addr()).is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(key), K(old_addr), K(old_tablet_handle), K(new_tablet_handle), KPC(new_tablet), K(new_addr)); } else { ObMetaDiskAddr addr; ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); ObBucketHashWLockGuard lock_guard(bucket_lock_, key.tablet_id_.hash()); time_guard.click("Lock"); ObTabletHandle curr_tablet_handle; if (OB_FAIL(direct_get_tablet(key.tablet_id_, curr_tablet_handle))) { if (OB_ENTRY_NOT_EXIST == ret) { ret = OB_SUCCESS; // deleted, skip } else { LOG_WARN("fail to get tablet", K(ret), K(key)); } } else if (curr_tablet_handle.get_obj() != old_tablet_handle.get_obj()) { // we could never persist this tablet, skip this LOG_INFO("tablet has been changed", K(ret), K(key), K(old_addr), K(old_tablet_handle), K(curr_tablet_handle)); } else if (FALSE_IT(addr = curr_tablet_handle.get_obj()->get_tablet_addr())) { } else if (old_addr != addr) { /* the same full tablet obj with different memtables will hit this */ // Let this updating fail and throw tablet back to the persist queue. // It will be tackled correctly in the next round because its address will be compared // again in ObFullTabletCreator::persist_tablet() ret = common::OB_NOT_THE_OBJECT; LOG_WARN("old address has changed, skip update", K(ret), K(key), K(addr), K(old_addr)); } else { time_guard.click("GetOld"); if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(key.ls_id_, key.tablet_id_, new_addr))) { LOG_WARN("fail to write update tablet slog", K(ret), K(key), K(new_addr)); } else if (FALSE_IT(time_guard.click("WrSlog"))) { } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_handle, new_tablet_handle))) { LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(old_tablet_handle), K(new_tablet_handle)); ob_usleep(1000 * 1000); ob_abort(); } else if (FALSE_IT(time_guard.click("CASwap"))) { } else { FLOG_INFO("succeeded to update tablet mstx", K(ret), K(key), K(old_addr), K(old_tablet_handle), K(new_addr), K(new_tablet_handle)); } } } return ret; } int ObLSTabletService::update_tablet_to_empty_shell(const common::ObTabletID &tablet_id) { int ret = OB_SUCCESS; const share::ObLSID &ls_id = ls_->get_ls_id(); const ObTabletMapKey key(ls_id, tablet_id); common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "UpdEmptySh")); ObTabletHandle new_tablet_handle; ObTabletHandle tmp_tablet_handle; ObTabletHandle old_tablet_handle; ObTimeGuard time_guard("UpdateTabletToEmptyShell", 3_s); ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); time_guard.click("Lock"); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("ls tablet svr hasn't been inited", K(ret)); } else if (OB_UNLIKELY(!tablet_id.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(tablet_id)); } else if (OB_FAIL(direct_get_tablet(tablet_id, old_tablet_handle))) { LOG_WARN("failed to get tablet", K(ret), K(tablet_id)); } else if (old_tablet_handle.get_obj()->is_empty_shell()) { LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", old_tablet_handle.get_obj()); } else if (FALSE_IT(time_guard.click("GetOld"))) { } else if (OB_FAIL(ObTabletCreateDeleteHelper::acquire_tmp_tablet(key, allocator, tmp_tablet_handle))) { LOG_WARN("fail to acquire temporary tablet", K(ret), K(key)); } else { time_guard.click("Acquire"); ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); ObTablet *old_tablet = old_tablet_handle.get_obj(); ObTablet *tmp_tablet = tmp_tablet_handle.get_obj(); ObTablet *new_tablet = nullptr; ObMetaDiskAddr disk_addr; if (OB_FAIL(tmp_tablet->init_empty_shell(*tmp_tablet_handle.get_allocator(), *old_tablet))) { LOG_WARN("failed to init tablet", K(ret), KPC(old_tablet)); } else if (FALSE_IT(time_guard.click("InitNew"))) { } else if (OB_FAIL(ObTabletPersister::transform_empty_shell(*tmp_tablet, new_tablet_handle))) { LOG_WARN("fail to transform emtpy shell", K(ret), K(tablet_id)); } else if (FALSE_IT(time_guard.click("Trans"))) { } else if (FALSE_IT(new_tablet = new_tablet_handle.get_obj())) { } else if (OB_FAIL(ObTabletSlogHelper::write_empty_shell_tablet_slog(new_tablet, disk_addr))) { LOG_WARN("fail to write emtpy shell tablet slog", K(ret), K(tablet_id), K(disk_addr)); } else if (FALSE_IT(new_tablet->tablet_addr_ = disk_addr)) { } else if (FALSE_IT(time_guard.click("WrSlog"))) { } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_handle, new_tablet_handle))) { LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(old_tablet_handle), K(new_tablet_handle)); ob_usleep(1000 * 1000); ob_abort(); } else { ls_->get_tablet_gc_handler()->set_tablet_gc_trigger(); time_guard.click("CASwap"); LOG_INFO("succeeded to build empty shell tablet", K(ret), K(key), K(disk_addr)); } } return ret; } int ObLSTabletService::update_medium_compaction_info( const common::ObTabletID &tablet_id, ObTabletHandle &handle) { int ret = OB_SUCCESS; common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "UpMeidumCom")); ObTabletHandle old_tablet_handle; ObTimeGuard time_guard("ObLSTabletService::update_medium_compaction_info", 1_s); ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); time_guard.click("Lock"); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!tablet_id.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(tablet_id)); } else if (OB_FAIL(direct_get_tablet(tablet_id, old_tablet_handle))) { LOG_WARN("failed to check and get tablet", K(ret), K(tablet_id)); } else if (old_tablet_handle.get_obj()->is_empty_shell()) { handle = old_tablet_handle; LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", old_tablet_handle.get_obj()); } else { time_guard.click("GetTablet"); ObTabletHandle tmp_tablet_hdl; ObTabletHandle new_tablet_hdl; ObTablet *tmp_tablet = nullptr; ObTablet *old_tablet = old_tablet_handle.get_obj(); const share::ObLSID &ls_id = ls_->get_ls_id(); const ObTabletMapKey key(ls_id, tablet_id); ObMetaDiskAddr disk_addr; ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); if (OB_FAIL(ObTabletCreateDeleteHelper::acquire_tmp_tablet(key, allocator, tmp_tablet_hdl))) { if (OB_ENTRY_NOT_EXIST == ret) { ret = OB_TABLET_NOT_EXIST; } else { LOG_WARN("failed to acquire tablet", K(ret), K(key)); } } else if (FALSE_IT(tmp_tablet = tmp_tablet_hdl.get_obj())) { } else if (OB_FAIL(tmp_tablet->init_with_update_medium_info(allocator, *old_tablet))) { LOG_WARN("failed to init tablet", K(ret), KPC(old_tablet)); } else if (FALSE_IT(time_guard.click("InitNew"))) { } else if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tmp_tablet, new_tablet_hdl))) { LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tmp_tablet), K(new_tablet_hdl)); } else if (FALSE_IT(disk_addr = new_tablet_hdl.get_obj()->tablet_addr_)) { } else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) { LOG_WARN("fail to write update tablet slog", K(ret), K(ls_id), K(tablet_id), K(disk_addr)); } else if (FALSE_IT(time_guard.click("WrSlog"))) { } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_handle, new_tablet_hdl))) { LOG_WARN("failed to compare and swap tablet", K(ret), K(key), K(old_tablet_handle), K(new_tablet_hdl)); } else if (FALSE_IT(time_guard.click("CASwap"))) { } else { handle = new_tablet_hdl; } } return ret; } int ObLSTabletService::build_new_tablet_from_mds_table( const common::ObTabletID &tablet_id, const int64_t mds_construct_sequence, const share::SCN &flush_scn) { TIMEGUARD_INIT(STORAGE, 10_ms); int ret = OB_SUCCESS; common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "BuildMSD")); const share::ObLSID &ls_id = ls_->get_ls_id(); const ObTabletMapKey key(ls_id, tablet_id); ObTabletHandle old_tablet_handle; ObTabletHandle tmp_tablet_hdl; ObTabletHandle new_tablet_handle; ObTimeGuard time_guard("MdsDump", 3_s); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!tablet_id.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(tablet_id)); } else if (CLICK_FAIL(ObTabletCreateDeleteHelper::acquire_tmp_tablet(key, allocator, tmp_tablet_hdl))) { LOG_WARN("failed to acquire tablet", K(ret), K(key)); } else { ObTablet *tmp_tablet = tmp_tablet_hdl.get_obj(); time_guard.click("Acquire"); CLICK(); ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); time_guard.click("Lock"); if (CLICK_FAIL(direct_get_tablet(tablet_id, old_tablet_handle))) { LOG_WARN("failed to get tablet", K(ret), K(tablet_id)); } else if (old_tablet_handle.get_obj()->is_empty_shell()) { LOG_INFO("old tablet is empty shell tablet, should skip mds table dump operation", K(ret), "old_tablet", *old_tablet_handle.get_obj()); } else { time_guard.click("GetOld"); ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); ObTablet *old_tablet = old_tablet_handle.get_obj(); ObMetaDiskAddr disk_addr; ObArenaAllocator arena_allocator(common::ObMemAttr(MTL_ID(), "mds_reader")); ObTabletMdsData mds_data; if (OB_FAIL(ret)) { } else if (CLICK_FAIL(old_tablet->read_mds_table(arena_allocator, mds_data, true, mds_construct_sequence))) { if (OB_EMPTY_RESULT == ret) { ret = OB_SUCCESS; LOG_INFO("read nothing from mds table, no need to build new tablet", K(ret), K(key)); } else { LOG_WARN("failed to read mds table", K(ret), K(key)); } } else if (CLICK_FAIL(tmp_tablet->init_for_mds_table_dump(allocator, *old_tablet, flush_scn, mds_data, old_tablet->mds_data_))) { LOG_WARN("failed to init tablet", K(ret), KPC(old_tablet), K(flush_scn)); } else if (CLICK_FAIL(ObTabletPersister::persist_and_transform_tablet(*tmp_tablet, new_tablet_handle))) { LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tmp_tablet), K(new_tablet_handle)); } else if (FALSE_IT(disk_addr = new_tablet_handle.get_obj()->tablet_addr_)) { } else if (CLICK_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) { } else if (FALSE_IT(time_guard.click("WrSlog"))) { LOG_WARN("fail to write update tablet slog", K(ret), K(ls_id), K(tablet_id), K(disk_addr)); } else if (CLICK_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_handle, new_tablet_handle))) { LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(disk_addr), K(old_tablet_handle)); ob_usleep(1000 * 1000); ob_abort(); } else { CLICK(); time_guard.click("CASwap"); LOG_INFO("succeeded to build new tablet", K(ret), K(key), K(disk_addr), K(new_tablet_handle), K(mds_data)); } } } return ret; } int ObLSTabletService::update_tablet_release_memtable_for_offline( const common::ObTabletID &tablet_id, const SCN scn) { int ret = OB_SUCCESS; const ObLSID ls_id(ls_->get_ls_id()); const ObTabletMapKey key(ls_id, tablet_id); ObTabletHandle tablet_handle; ObTablet *tablet = nullptr; ObTimeGuard time_guard("ObLSTabletService::update_tablet_release_memtable", 1_s); ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); time_guard.click("Lock"); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!tablet_id.is_valid() || !scn.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid arguments", K(ret), K(tablet_id), K(scn)); } else if (OB_FAIL(ObTabletCreateDeleteHelper::get_tablet(key, tablet_handle))) { LOG_WARN("fail to direct get tablet", K(ret), K(key)); } else if (OB_ISNULL(tablet = tablet_handle.get_obj())) { ret = OB_ERR_UNEXPECTED; LOG_WARN("tablet should not be NULL", K(ret), K(key)); } else if (tablet->is_empty_shell()) { //do nothing } else { time_guard.click("get_tablet"); ObITable *table = nullptr; ObTableStoreIterator iter; const bool is_from_buf_pool = nullptr == tablet_handle.get_obj()->get_allocator(); if (is_from_buf_pool) { ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); ObTabletHandle new_tablet_handle; if (OB_FAIL(ObTabletPersister::copy_from_old_tablet(*tablet, new_tablet_handle))) { LOG_WARN("fail to copy from old tablet", K(ret), KPC(tablet)); } else if (FALSE_IT(time_guard.click("CpTablet"))) { } else if (OB_FAIL(new_tablet_handle.get_obj()->rebuild_memtables(scn))) { LOG_WARN("fail to rebuild memtables", K(ret), K(scn), K(new_tablet_handle)); } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, tablet_handle, new_tablet_handle))) { LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(tablet_handle), K(new_tablet_handle)); } else { time_guard.click("CASwap"); LOG_INFO("succeeded to copy tablet to release memtable", K(ret), K(key), K(tablet_handle), K(new_tablet_handle)); } } else if (OB_UNLIKELY(!tablet->get_tablet_addr().is_memory())) { ret = OB_NOT_SUPPORTED; LOG_ERROR("This tablet is full tablet, but its addr isn't memory", K(ret), KPC(tablet)); } else if (OB_FAIL(tablet->get_all_sstables(iter))) { LOG_WARN("fail to get all sstable", K(ret), K(iter)); } else if (1 == iter.count() && OB_FAIL(iter.get_next(table))) { LOG_WARN("fail to get next table", K(ret), K(iter)); } else if (OB_UNLIKELY(iter.count() > 1) || (OB_NOT_NULL(table) && (!table->is_sstable() || static_cast(table)->get_data_macro_block_count() != 0))) { ret = OB_NOT_SUPPORTED; LOG_ERROR("This tablet is full tablet, but all of its sstables isn't only one empty major", K(ret), K(iter), KPC(table)); } else if (OB_FAIL(tablet_handle.get_obj()->wait_release_memtables())) { LOG_ERROR("failed to release memtables", K(ret), K(tablet_id)); } else if (OB_FAIL(inner_remove_tablet(ls_id, tablet_id))) { LOG_ERROR("failed to do remove tablet", K(ret), K(ls_id), K(tablet_id)); } else { time_guard.click("RmTablet"); } } return ret; } int ObLSTabletService::update_tablet_report_status( const common::ObTabletID &tablet_id, const bool found_column_group_checksum_error) { int ret = OB_SUCCESS; ObTabletHandle tablet_handle; ObTimeGuard time_guard("ObLSTabletService::update_tablet_report_status", 1_s); ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); time_guard.click("Lock"); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!tablet_id.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(tablet_id)); } else if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle))) { LOG_WARN("failed to get tablet", K(ret), K(tablet_id)); } else if (tablet_handle.get_obj()->is_empty_shell()) { LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", tablet_handle.get_obj()); } else { time_guard.click("GetTablet"); ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); ObMetaDiskAddr disk_addr; const ObTabletMapKey key(ls_->get_ls_id(), tablet_id); ObTablet *tablet = tablet_handle.get_obj(); ObTabletHandle new_tablet_handle; bool need_report = true; if (OB_UNLIKELY(found_column_group_checksum_error)) { tablet->tablet_meta_.report_status_.found_cg_checksum_error_ = true; } else if (tablet->tablet_meta_.report_status_.need_report()) { tablet->tablet_meta_.report_status_.cur_report_version_ = tablet->tablet_meta_.report_status_.merge_snapshot_version_; } else { need_report = false; FLOG_INFO("tablet doesn't need to report", K(ret), K(tablet_id)); } if (need_report) { if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tablet, new_tablet_handle))) { LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tablet), K(new_tablet_handle)); } else if (FALSE_IT(time_guard.click("Persist"))) { } else if (FALSE_IT(disk_addr = new_tablet_handle.get_obj()->tablet_addr_)) { } else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(key.ls_id_, tablet_id, disk_addr))) { LOG_WARN("failed to write update tablet slog", K(ret), K(key), K(disk_addr)); } else if (FALSE_IT(time_guard.click("WrSlog"))) { } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, tablet_handle, new_tablet_handle))) { LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(tablet_handle), K(new_tablet_handle)); ob_usleep(1000 * 1000); ob_abort(); } else { time_guard.click("CASwap"); LOG_INFO("succeeded to build new tablet", K(ret), K(key), K(disk_addr), K(tablet_handle)); } } } return ret; } int ObLSTabletService::update_tablet_snapshot_version( const common::ObTabletID &tablet_id, const int64_t snapshot_version) { int ret = OB_SUCCESS; common::ObArenaAllocator allocator; ObTabletHandle old_tablet_handle; ObTimeGuard time_guard("ObLSTabletService::update_tablet_snapshot_version", 1 * 1000 * 1000); ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); time_guard.click("Lock"); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!tablet_id.is_valid() || 0 >= snapshot_version)) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(tablet_id), K(snapshot_version)); } else if (OB_FAIL(direct_get_tablet(tablet_id, old_tablet_handle))) { LOG_WARN("failed to check and get tablet", K(ret), K(tablet_id)); } else { time_guard.click("GetTablet"); ObTabletHandle tmp_tablet_hdl; ObTabletHandle new_tablet_hdl; ObTablet *tmp_tablet = nullptr; ObTablet *old_tablet = old_tablet_handle.get_obj(); const share::ObLSID &ls_id = ls_->get_ls_id(); const ObTabletMapKey key(ls_id, tablet_id); ObMetaDiskAddr disk_addr; ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); if (OB_FAIL(ObTabletCreateDeleteHelper::acquire_tmp_tablet(key, allocator, tmp_tablet_hdl))) { if (OB_ENTRY_NOT_EXIST == ret) { ret = OB_TABLET_NOT_EXIST; } else { LOG_WARN("failed to acquire tablet", K(ret), K(key)); } } else if (FALSE_IT(tmp_tablet = tmp_tablet_hdl.get_obj())) { } else if (OB_FAIL(tmp_tablet->init_with_new_snapshot_version(allocator, *old_tablet, snapshot_version))) { LOG_WARN("failed to init tablet", K(ret), KPC(old_tablet)); } else if (FALSE_IT(time_guard.click("InitNew"))) { } else if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tmp_tablet, new_tablet_hdl))) { LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tmp_tablet), K(new_tablet_hdl)); } else if (FALSE_IT(disk_addr = new_tablet_hdl.get_obj()->tablet_addr_)) { } else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) { LOG_WARN("fail to write update tablet slog", K(ret), K(ls_id), K(tablet_id), K(disk_addr)); } else if (FALSE_IT(time_guard.click("WrSlog"))) { } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_handle, new_tablet_hdl))) { LOG_WARN("failed to compare and swap tablet", K(ret), K(key), K(old_tablet_handle), K(new_tablet_hdl)); } else { time_guard.click("CASwap"); } } return ret; } int ObLSTabletService::update_tablet_restore_status( const common::ObTabletID &tablet_id, const ObTabletRestoreStatus::STATUS &restore_status) { int ret = OB_SUCCESS; ObTabletHandle tablet_handle; ObTabletRestoreStatus::STATUS current_status = ObTabletRestoreStatus::RESTORE_STATUS_MAX; bool can_change = false; ObTimeGuard time_guard("ObLSTabletService::update_tablet_restore_status", 1_s); ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); time_guard.click("Lock"); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!tablet_id.is_valid()) || OB_UNLIKELY(!ObTabletRestoreStatus::is_valid(restore_status))) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(tablet_id), K(restore_status)); } else if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle))) { LOG_WARN("failed to get tablet", K(ret), K(tablet_id)); } else if (tablet_handle.get_obj()->is_empty_shell()) { LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", tablet_handle.get_obj()); } else { time_guard.click("GetTablet"); ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); ObMetaDiskAddr disk_addr; const ObTabletMapKey key(ls_->get_ls_id(), tablet_id); ObTablet *tablet = tablet_handle.get_obj(); ObTabletHandle new_tablet_handle; if (OB_FAIL(tablet->tablet_meta_.ha_status_.get_restore_status(current_status))) { LOG_WARN("failed to get restore status", K(ret), KPC(tablet)); } else if (OB_FAIL(ObTabletRestoreStatus::check_can_change_status(current_status, restore_status, can_change))) { LOG_WARN("failed to check can change status", K(ret), K(current_status), K(restore_status), KPC(tablet)); } else if (!can_change) { ret = OB_ERR_UNEXPECTED; LOG_WARN("can not change restore status", K(ret), K(current_status), K(restore_status), KPC(tablet)); } else if (OB_FAIL(tablet->tablet_meta_.ha_status_.set_restore_status(restore_status))) { LOG_WARN("failed to set restore status", K(ret), K(restore_status), KPC(tablet)); } else if (restore_status == ObTabletRestoreStatus::UNDEFINED && OB_FALSE_IT((void)tablet->tablet_meta_.reset_transfer_table())) { } else { // TODO(jiahua.cjh) move check valid to tablet init after generate new version tablet. if (OB_FAIL(tablet->check_valid())) { LOG_WARN("failed to check tablet valid", K(ret), K(restore_status), KPC(tablet)); } else if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tablet, new_tablet_handle))) { LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tablet), K(new_tablet_handle)); } else if (FALSE_IT(time_guard.click("Persist"))) { } else if (FALSE_IT(disk_addr = new_tablet_handle.get_obj()->tablet_addr_)) { } else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(key.ls_id_, tablet_id, disk_addr))) { LOG_WARN("failed to write update tablet slog", K(ret), K(key), K(disk_addr)); } else if (FALSE_IT(time_guard.click("WrSlog"))) { } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, tablet_handle, new_tablet_handle))) { LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(tablet_handle), K(new_tablet_handle)); ob_abort(); } else { time_guard.click("CASwap"); LOG_INFO("succeeded to build new tablet", K(ret), K(key), K(disk_addr), K(restore_status), K(tablet_handle)); } if (OB_FAIL(ret)) { int tmp_ret = OB_SUCCESS; if (OB_SUCCESS != (tmp_ret = tablet->tablet_meta_.ha_status_.set_restore_status(current_status))) { LOG_WARN("failed to set restore status", K(tmp_ret), K(current_status), KPC(tablet)); ob_abort(); } } } } return ret; } int ObLSTabletService::update_tablet_ha_data_status( const common::ObTabletID &tablet_id, const ObTabletDataStatus::STATUS &data_status) { int ret = OB_SUCCESS; ObTabletHandle tablet_handle; ObTabletDataStatus::STATUS current_status = ObTabletDataStatus::DATA_STATUS_MAX; bool can_change = false; ObTimeGuard time_guard("ObLSTabletService::update_tablet_ha_data_status", 1_s); ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); time_guard.click("Lock"); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(is_stopped_)) { ret = OB_NOT_RUNNING; LOG_WARN("tablet service stopped", K(ret)); } else if (OB_UNLIKELY(!tablet_id.is_valid()) || OB_UNLIKELY(!ObTabletDataStatus::is_valid(data_status))) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(tablet_id), K(data_status)); } else if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle))) { LOG_WARN("failed to get tablet", K(ret), K(tablet_id)); } else if (tablet_handle.get_obj()->is_empty_shell()) { LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", tablet_handle.get_obj()); } else { time_guard.click("GetTablet"); ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); ObMetaDiskAddr disk_addr; const ObTabletMapKey key(ls_->get_ls_id(), tablet_id); ObTablet *tablet = tablet_handle.get_obj(); ObTabletHandle new_tablet_handle; if (OB_FAIL(tablet->tablet_meta_.ha_status_.get_data_status(current_status))) { LOG_WARN("failed to get data status", K(ret), KPC(tablet)); } else if (OB_FAIL(ObTabletDataStatus::check_can_change_status(current_status, data_status, can_change))) { LOG_WARN("failed to check can change status", K(ret), K(current_status), K(data_status), KPC(tablet)); } else if (!can_change) { ret = OB_ERR_UNEXPECTED; LOG_WARN("can not change data status", K(ret), K(current_status), K(data_status), KPC(tablet)); } else if (current_status == data_status) { LOG_INFO("data status is same, skip update", K(tablet_id), K(current_status), K(data_status)); } else if (OB_FAIL(tablet->tablet_meta_.ha_status_.set_data_status(data_status))) { LOG_WARN("failed to set data status", K(ret), KPC(tablet), K(data_status)); } else { if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tablet, new_tablet_handle))) { LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tablet), K(new_tablet_handle)); } else if (FALSE_IT(time_guard.click("Persist"))) { } else if (FALSE_IT(disk_addr = new_tablet_handle.get_obj()->tablet_addr_)) { } else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(key.ls_id_, tablet_id, disk_addr))) { LOG_WARN("failed to write update tablet slog", K(ret), K(tablet_handle), K(disk_addr)); } else if (FALSE_IT(time_guard.click("WrSlog"))) { } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, tablet_handle, new_tablet_handle))) { LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(tablet_handle), K(new_tablet_handle)); ob_usleep(1000 * 1000); ob_abort(); } else { time_guard.click("CASwap"); LOG_INFO("succeeded to update tablet ha data status", K(ret), K(key), K(disk_addr), K(data_status), K(tablet_handle)); } if (OB_FAIL(ret)) { int tmp_ret = OB_SUCCESS; if (OB_SUCCESS != (tmp_ret = tablet->tablet_meta_.ha_status_.set_data_status(current_status))) { LOG_WARN("failed to set data status", K(tmp_ret), K(current_status), KPC(tablet)); ob_abort(); } } } } return ret; } int ObLSTabletService::update_tablet_ha_expected_status( const common::ObTabletID &tablet_id, const ObTabletExpectedStatus::STATUS &expected_status) { int ret = OB_SUCCESS; ObTabletHandle tablet_handle; ObTabletExpectedStatus::STATUS current_status = ObTabletExpectedStatus::EXPECTED_STATUS_MAX; bool can_change = false; ObTimeGuard time_guard("ObLSTabletService::update_tablet_ha_data_status", 1_s); ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); time_guard.click("Lock"); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(is_stopped_)) { ret = OB_NOT_RUNNING; LOG_WARN("tablet service stopped", K(ret)); } else if (OB_UNLIKELY(!tablet_id.is_valid()) || OB_UNLIKELY(!ObTabletExpectedStatus::is_valid(expected_status))) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(tablet_id), K(expected_status)); } else if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle))) { LOG_WARN("failed to get tablet", K(ret), K(tablet_id)); } else if (tablet_handle.get_obj()->is_empty_shell()) { LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", tablet_handle.get_obj()); } else { time_guard.click("GetTablet"); ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); ObMetaDiskAddr disk_addr; const ObTabletMapKey key(ls_->get_ls_id(), tablet_id); ObTablet *tablet = tablet_handle.get_obj(); ObTabletHandle new_tablet_handle; if (OB_FAIL(tablet->tablet_meta_.ha_status_.get_expected_status(current_status))) { LOG_WARN("failed to get data status", K(ret), KPC(tablet)); } else if (expected_status == current_status) { LOG_INFO("tablet ha expected status is same, no need update", K(tablet_id), K(current_status), K(expected_status)); } else if (OB_FAIL(ObTabletExpectedStatus::check_can_change_status(current_status, expected_status, can_change))) { LOG_WARN("failed to check can change status", K(ret), K(current_status), K(expected_status), KPC(tablet)); } else if (!can_change) { ret = OB_ERR_UNEXPECTED; LOG_WARN("can not change meta status", K(ret), K(current_status), K(expected_status), KPC(tablet)); } else { if (OB_FAIL(tablet->tablet_meta_.ha_status_.set_expected_status(expected_status))) { LOG_WARN("failed to set ha meta status", K(ret), KPC(tablet), K(expected_status)); } else { if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tablet, new_tablet_handle))) { LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tablet), K(new_tablet_handle)); } else if (FALSE_IT(disk_addr = new_tablet_handle.get_obj()->tablet_addr_)) { } else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(key.ls_id_, tablet_id, disk_addr))) { LOG_WARN("failed to write update tablet slog", K(ret), K(tablet_handle), K(disk_addr)); } else if (FALSE_IT(time_guard.click("WrSlog"))) { } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, tablet_handle, new_tablet_handle))) { LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(tablet_handle), K(new_tablet_handle)); usleep(1000 * 1000); ob_abort(); } else { time_guard.click("CASwap"); LOG_INFO("succeeded to update tablet meta status", K(ret), K(key), K(disk_addr), K(expected_status), KPC(tablet)); } if (OB_FAIL(ret)) { int tmp_ret = OB_SUCCESS; if (OB_SUCCESS != (tmp_ret = tablet->tablet_meta_.ha_status_.set_expected_status(current_status))) { LOG_WARN("failed to set expected status", K(tmp_ret), K(current_status), KPC(tablet)); ob_abort(); } } } } } return ret; } int ObLSTabletService::replay_create_tablet( const ObMetaDiskAddr &disk_addr, const char *buf, const int64_t buf_len, const ObTabletID &tablet_id, ObTabletTransferInfo &tablet_transfer_info) { int ret = OB_SUCCESS; bool b_exist = false; ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); ObFreezer *freezer = ls_->get_freezer(); const ObLSID &ls_id = ls_->get_ls_id(); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret)); } else if (OB_FAIL(has_tablet(ls_id, tablet_id, b_exist))) { LOG_WARN("fail to check tablet existence", K(ret), K(ls_id), K(tablet_id)); } else if (b_exist) { ret = OB_ERR_UNEXPECTED; LOG_ERROR("restart replay tablet should not exist", K(ret), K(ls_id), K(tablet_id)); } else { ObTimeGuard time_guard("ObLSTabletService::replay_create_tablet", 1_s); common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "ReplayCreate")); const ObTabletMapKey key(ls_id, tablet_id); ObTabletHandle tablet_hdl; ObTablet *tablet = nullptr; int64_t pos = 0; ObMetaDiskAddr old_addr; ObTabletPoolType pool_type; ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); time_guard.click("Lock"); if (OB_FAIL(ObTabletCreateDeleteHelper::create_tmp_tablet(key, allocator, tablet_hdl))) { LOG_WARN("fail to create temporary tablet", K(ret), K(key)); } else if (FALSE_IT(tablet = tablet_hdl.get_obj())) { } else if (FALSE_IT(tablet->tablet_addr_ = disk_addr)) { } else if (OB_FAIL(t3m->get_tablet_addr(key, old_addr))) { LOG_WARN("fail to get tablet addr", K(ret), K(key)); } else if (OB_FAIL(tablet->deserialize(allocator, buf, buf_len, pos))) { LOG_WARN("fail to deserialize tablet", K(ret), K(buf), K(buf_len), K(pos)); } else if (FALSE_IT(time_guard.click("Deserialize"))) { } else if (OB_FAIL(tablet->init_shared_params(ls_id, tablet_id, tablet->get_tablet_meta().max_sync_storage_schema_version_, tablet->get_tablet_meta().max_serialized_medium_scn_, tablet->get_tablet_meta().compat_mode_, freezer))) { LOG_WARN("failed to init shared params", K(ret), K(ls_id), K(tablet_id)); } else if (OB_FAIL(tablet_id_set_.set(tablet_id))) { LOG_WARN("fail to set tablet id set", K(ret), K(tablet_id)); } else { if (tablet->is_empty_shell()) { pool_type = ObTabletPoolType::TP_NORMAL; } else { const int64_t try_cache_size = tablet->get_try_cache_size(); if (try_cache_size > ObTenantMetaMemMgr::NORMAL_TABLET_POOL_SIZE) { pool_type = ObTabletPoolType::TP_LARGE; } else { pool_type = ObTabletPoolType::TP_NORMAL; } } } if (OB_FAIL(ret)) { // do nothing } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_addr, disk_addr, pool_type, true /* whether to set tablet pool */))) { LOG_WARN("fail to compare and swap tablat in t3m", K(ret), K(key), K(old_addr), K(disk_addr)); } else if (FALSE_IT(time_guard.click("CASwap"))) { } else if (OB_FAIL(tablet->check_and_set_initial_state())) { LOG_WARN("fail to check and set initial state", K(ret), K(key)); } else if (OB_FAIL(tablet->start_ddl_if_need())) { LOG_WARN("start ddl if need failed", K(ret)); } else if (OB_FAIL(tablet->inc_macro_ref_cnt())) { LOG_WARN("fail to increase macro blocks' ref cnt for meta and data", K(ret)); } if (OB_SUCC(ret)) { tablet_transfer_info = tablet->get_tablet_meta().transfer_info_; FLOG_INFO("succeeded to replay create one tablet", K(ret), K(ls_id), K(tablet_id), KPC(tablet)); } else { int tmp_ret = OB_SUCCESS; if (OB_TMP_FAIL(tablet_id_set_.erase(tablet_id))) { if (OB_HASH_NOT_EXIST != tmp_ret) { LOG_ERROR("fail to erase tablet id from set", K(tmp_ret), K(tablet_id)); } } if (OB_TMP_FAIL(inner_remove_tablet(key.ls_id_, key.tablet_id_))) { LOG_WARN("fail to erase tablet from meta memory manager", K(tmp_ret), K(key)); } } } return ret; } int ObLSTabletService::get_tablet_with_timeout( const common::ObTabletID &tablet_id, ObTabletHandle &handle, const int64_t retry_timeout_us, const ObMDSGetTabletMode mode, const share::SCN &snapshot) { int ret = OB_SUCCESS; const ObTabletMapKey key(ls_->get_ls_id(), tablet_id); const int64_t timeout_step_us = 10 * 1000 * 1000; // 10s const int64_t snapshot_version = snapshot.get_val_for_tx(); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!tablet_id.is_valid() || mode < ObMDSGetTabletMode::READ_ALL_COMMITED)) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(tablet_id), K(mode)); } else if (OB_FAIL(ObTabletCreateDeleteHelper::check_and_get_tablet(key, handle, timeout_step_us, mode, snapshot_version))) { while (OB_ALLOCATE_MEMORY_FAILED == ret && ObClockGenerator::getClock() < retry_timeout_us) { ret = ObTabletCreateDeleteHelper::check_and_get_tablet(key, handle, timeout_step_us, mode, snapshot_version); } if (OB_ALLOCATE_MEMORY_FAILED == ret) { ret = OB_TIMEOUT; LOG_WARN("get tablet timeout", K(ret), K(retry_timeout_us), K(ObTimeUtil::current_time()), K(mode)); } } return ret; } int ObLSTabletService::direct_get_tablet(const common::ObTabletID &tablet_id, ObTabletHandle &handle) { TIMEGUARD_INIT(STORAGE, 10_ms); int ret = OB_SUCCESS; const ObTabletMapKey key(ls_->get_ls_id(), tablet_id); if (CLICK_FAIL(ObTabletCreateDeleteHelper::get_tablet(key, handle))) { LOG_WARN("failed to get tablet from t3m", K(ret), K(key)); } return ret; } int ObLSTabletService::inner_table_scan( ObTabletHandle &tablet_handle, ObTableScanIterator &iter, ObTableScanParam ¶m) { // NOTICE: ObTableScanParam for_update_ param is ignored here, // upper layer will handle it, so here for_update_ is always false int ret = OB_SUCCESS; ObStoreCtx &store_ctx = iter.get_ctx_guard().get_store_ctx(); int64_t data_max_schema_version = 0; bool is_bounded_staleness_read = (NULL == param.trans_desc_) ? false : param.snapshot_.is_weak_read(); if (OB_UNLIKELY(!tablet_handle.is_valid()) || OB_UNLIKELY(!param.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(tablet_handle), K(param)); } else if (is_bounded_staleness_read && OB_FAIL(tablet_handle.get_obj()->get_max_schema_version(data_max_schema_version))) { LOG_WARN("failed to get max schema version", K(ret), K(param)); } else if (is_bounded_staleness_read && OB_FAIL(tablet_handle.get_obj()->check_schema_version_for_bounded_staleness_read( param.schema_version_, data_max_schema_version, param.index_id_))) { //check schema_version with ref_table_id, because schema_version of scan_param is from ref table LOG_WARN("check schema version for bounded staleness read fail", K(ret), K(param)); //need to get store ctx of PG, cur_key_ saves the real partition } else if (param.fb_snapshot_.is_min()) { ret = OB_SNAPSHOT_DISCARDED; } else { const int64_t snapshot_version = store_ctx.mvcc_acc_ctx_.get_snapshot_version().get_val_for_tx(); const int64_t current_time = ObClockGenerator::getClock(); const int64_t timeout = param.timeout_ - current_time; if (OB_UNLIKELY(timeout <= 0)) { ret = OB_TIMEOUT; LOG_WARN("table scan timeout", K(ret), K(current_time), "table_scan_param_timeout", param.timeout_, K(lbt())); } else if (OB_FAIL(tablet_handle.get_obj()->check_snapshot_readable_with_cache(snapshot_version, timeout))) { LOG_WARN("failed to check snapshot readable", K(ret), K(snapshot_version), K(timeout)); } else if (param.need_switch_param_) { if (OB_FAIL(iter.switch_param(param, tablet_handle))) { LOG_WARN("failed to init table scan iterator, ", K(ret)); } } else if (OB_FAIL(iter.init(param, tablet_handle))) { LOG_WARN("failed to init table scan iterator, ", K(ret)); } } if (OB_FAIL(ret)) { LOG_WARN("failed to do table scan", K(ret), K(param), K(*this), K(data_max_schema_version)); } return ret; } int ObLSTabletService::has_tablet( const share::ObLSID &ls_id, const common::ObTabletID &tablet_id, bool &b_exist) { int ret = OB_SUCCESS; b_exist = false; const ObTabletMapKey key(ls_id, tablet_id); ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); if (OB_FAIL(t3m->has_tablet(key, b_exist))) { LOG_WARN("failed to check tablet exist", K(ret), K(key)); } return ret; } int ObLSTabletService::create_tablet( const share::ObLSID &ls_id, const common::ObTabletID &tablet_id, const common::ObTabletID &data_tablet_id, const share::SCN &create_scn, const int64_t snapshot_version, const share::schema::ObTableSchema &table_schema, const lib::Worker::CompatMode &compat_mode, ObTabletHandle &tablet_handle) { int ret = OB_SUCCESS; common::ObArenaAllocator tmp_allocator(common::ObMemAttr(MTL_ID(), "CreateTab")); common::ObArenaAllocator *allocator = nullptr; ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); const ObTabletMapKey key(ls_id, tablet_id); ObTablet *tablet = nullptr; ObFreezer *freezer = ls_->get_freezer(); bool need_create_empty_major_sstable = false; tablet_handle.reset(); if (OB_FAIL(ObTabletCreateDeleteHelper::prepare_create_msd_tablet())) { LOG_WARN("fail to prepare create msd tablet", K(ret)); } else { ObBucketHashWLockGuard lock_guard(bucket_lock_, key.tablet_id_.hash()); if (OB_FAIL(ObTabletCreateDeleteHelper::create_msd_tablet(key, tablet_handle))) { LOG_WARN("failed to create msd tablet", K(ret), K(key)); } else if (OB_ISNULL(tablet = tablet_handle.get_obj()) || OB_ISNULL(allocator = tablet_handle.get_allocator())) { ret = OB_ERR_UNEXPECTED; LOG_ERROR("new tablet is null", K(ret), KP(tablet), KP(allocator), K(tablet_handle)); } else if (OB_FAIL(ObTabletCreateDeleteHelper::check_need_create_empty_major_sstable( table_schema, need_create_empty_major_sstable))) { LOG_WARN("failed to check need create sstable", K(ret)); } else if (OB_FAIL(tablet->init_for_first_time_creation(*allocator, ls_id, tablet_id, data_tablet_id, create_scn, snapshot_version, table_schema, compat_mode, need_create_empty_major_sstable, freezer))) { LOG_WARN("failed to init tablet", K(ret), K(ls_id), K(tablet_id), K(data_tablet_id), K(create_scn), K(snapshot_version), K(table_schema), K(compat_mode)); } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, tablet_handle, tablet_handle))) { LOG_WARN("failed to compare and swap tablet", K(ret), K(key), K(tablet_handle)); } else if (OB_FAIL(tablet_id_set_.set(tablet_id))) { LOG_WARN("fail to insert tablet id", K(ret), K(ls_id), K(tablet_id)); } else { report_tablet_to_rs(tablet_id); } } return ret; } int ObLSTabletService::create_inner_tablet( const share::ObLSID &ls_id, const common::ObTabletID &tablet_id, const common::ObTabletID &data_tablet_id, const share::SCN &create_scn, const int64_t snapshot_version, const share::schema::ObTableSchema &table_schema, const lib::Worker::CompatMode &compat_mode, ObTabletHandle &tablet_handle) { int ret = OB_SUCCESS; common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "LSCreateTab")); ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); const ObTabletMapKey key(ls_id, tablet_id); ObTablet *tmp_tablet = nullptr; ObFreezer *freezer = ls_->get_freezer(); bool need_create_empty_major_sstable = false; ObTabletHandle tmp_tablet_hdl; ObMetaDiskAddr disk_addr; ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); if (OB_FAIL(ObTabletCreateDeleteHelper::create_tmp_tablet(key, allocator, tmp_tablet_hdl))) { LOG_WARN("failed to create temporary tablet", K(ret), K(key)); } else if (OB_ISNULL(tmp_tablet = tmp_tablet_hdl.get_obj())) { ret = OB_ERR_UNEXPECTED; LOG_ERROR("new tablet is null", K(ret), KPC(tmp_tablet), K(tmp_tablet_hdl)); } else if (OB_FAIL(ObTabletCreateDeleteHelper::check_need_create_empty_major_sstable( table_schema, need_create_empty_major_sstable))) { LOG_WARN("failed to check need create sstable", K(ret)); } else if (OB_FAIL(tmp_tablet->init_for_first_time_creation(allocator, ls_id, tablet_id, data_tablet_id, create_scn, snapshot_version, table_schema, compat_mode, need_create_empty_major_sstable, freezer))) { LOG_WARN("failed to init tablet", K(ret), K(ls_id), K(tablet_id), K(data_tablet_id), K(create_scn), K(snapshot_version), K(table_schema), K(compat_mode)); int tmp_ret = OB_SUCCESS; if (OB_TMP_FAIL(inner_remove_tablet(ls_id, tablet_id))) { LOG_ERROR("failed to delete tablet from t3m", K(ret), K(key), K(lbt())); ob_usleep(1000 * 1000); ob_abort(); } } else if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tmp_tablet, tablet_handle))) { LOG_WARN("fail to persist and transform tablet", K(ret), K(tmp_tablet_hdl), K(tablet_handle)); } else if (FALSE_IT(disk_addr = tablet_handle.get_obj()->get_tablet_addr())) { } else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) { LOG_WARN("failed to write update tablet slog", K(ret), K(tablet_handle)); } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, tablet_handle, tablet_handle))) { LOG_WARN("failed to add tablet to meta mem mgr", K(ret), K(key), K(tablet_handle)); } else if (OB_FAIL(tablet_id_set_.set(tablet_id))) { LOG_ERROR("fail to set tablet id set", K(ret), K(tablet_id), K(lbt())); ob_usleep(1000 * 1000); ob_abort(); } else { LOG_INFO("create inner tablet success", K(key), K(disk_addr)); } return ret; } int ObLSTabletService::create_transfer_in_tablet( const share::ObLSID &ls_id, const ObMigrationTabletParam &tablet_meta, ObTabletHandle &tablet_handle) { int ret = OB_SUCCESS; ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); const ObTabletMapKey key(ls_id, tablet_meta.tablet_id_); ObTablet *tablet = nullptr; ObFreezer *freezer = ls_->get_freezer(); common::ObArenaAllocator *allocator = nullptr; ObTabletHandle old_tablet_hdl; LOG_INFO("prepare to init transfer in tablet", K(ret), K(ls_id), K(tablet_meta)); ObTimeGuard time_guard("CreateTransferIn", 3_s); bool cover_empty_shell = false; if (!is_inited_) { ret = OB_NOT_INIT; LOG_WARN("ls tablet service do not init", K(ret)); } else if (!ls_id.is_valid() || !tablet_meta.is_valid()) { ret = OB_INVALID_ARGUMENT; LOG_WARN("create transfer in tablet get invalid argument", K(ret), K(ls_id), K(tablet_meta)); } else if (OB_FAIL(direct_get_tablet(tablet_meta.tablet_id_, old_tablet_hdl))) { if (OB_TABLET_NOT_EXIST == ret) { ret = OB_SUCCESS; LOG_DEBUG("tablet not exist", K(ret), K(tablet_meta.tablet_id_)); } else { LOG_WARN("fail to get tablet", K(ret), K(tablet_meta.tablet_id_)); } } else if (!old_tablet_hdl.get_obj()->is_empty_shell()) { ret = OB_ERR_UNEXPECTED; LOG_WARN("old tablet is not empty shell", K(ret), K(old_tablet_hdl)); } else if (FALSE_IT(cover_empty_shell = true)) { // Called in mds trans callback, slog won't be written. } else if (OB_FAIL(do_remove_tablet(key))) { LOG_WARN("failed to remove tablet", K(ret), K(key)); } time_guard.click("Prepare"); if (FAILEDx(ObTabletCreateDeleteHelper::prepare_create_msd_tablet())) { LOG_WARN("failed to prepare create msd tablet", K(ret)); } else { ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_meta.tablet_id_.hash()); time_guard.click("Lock"); if (FAILEDx(ObTabletCreateDeleteHelper::create_msd_tablet(key, tablet_handle))) { LOG_WARN("failed to create msd tablet", K(ret), K(key)); } else if (OB_ISNULL(tablet = tablet_handle.get_obj()) || OB_ISNULL(allocator = tablet_handle.get_allocator())) { ret = OB_ERR_UNEXPECTED; LOG_ERROR("new tablet is null", K(ret), KP(tablet), KP(allocator), K(tablet_handle)); } else if (OB_FAIL(tablet->init_with_migrate_param(*allocator, tablet_meta, false/*is_update*/, freezer))) { LOG_WARN("failed to init tablet", K(ret), K(ls_id), K(tablet_meta)); } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, tablet_handle, tablet_handle))) { LOG_WARN("failed to compare and swap tablet", K(ret), K(key), K(tablet_handle)); } else if (OB_FAIL(tablet_id_set_.set(tablet_meta.tablet_id_))) { LOG_WARN("fail to insert tablet id", K(ret), K(ls_id), K(tablet_meta)); } else { LOG_INFO("create transfer in tablet", K(ls_id), K(key), K(tablet_meta), K(cover_empty_shell)); time_guard.click("Swap"); } } return ret; } int ObLSTabletService::create_empty_shell_tablet( const ObMigrationTabletParam ¶m, ObTabletHandle &tablet_handle) { int ret = OB_SUCCESS; ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); const share::ObLSID &ls_id = param.ls_id_; const common::ObTabletID &tablet_id = param.tablet_id_; const ObTabletMapKey key(ls_id, tablet_id); ObTabletHandle old_tablet_hdl; if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("ls tablet svr hasn't been inited", K(ret)); } else if (OB_UNLIKELY(!key.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(key)); } else if (OB_FAIL(direct_get_tablet(tablet_id, old_tablet_hdl))) { if (OB_TABLET_NOT_EXIST == ret) { ret = OB_SUCCESS; LOG_DEBUG("tablet not exist", K(ret), K(tablet_id)); } else { LOG_WARN("fail to get tablet", K(ret), K(tablet_id)); } } else if (OB_FAIL(remove_tablet(old_tablet_hdl))) { LOG_WARN("failed to remove tablet", K(ret), K(key)); } ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); // must lock after prepare common::ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "MigEmptyT")); ObTabletHandle tmp_tablet_hdl; if (FAILEDx(ObTabletCreateDeleteHelper::create_tmp_tablet(key, allocator, tmp_tablet_hdl))) { LOG_WARN("fail to create temporary tablet", K(ret), K(key)); } else { ObFreezer *freezer = ls_->get_freezer(); ObTablet *tmp_tablet = tmp_tablet_hdl.get_obj(); ObTabletHandle tablet_handle; ObTablet *new_tablet = nullptr; ObMetaDiskAddr disk_addr; if (OB_FAIL(tmp_tablet->init_with_migrate_param(allocator, param, false/*is_update*/, freezer))) { LOG_WARN("failed to init tablet", K(ret), K(param)); } else if (OB_FAIL(ObTabletPersister::transform_empty_shell(*tmp_tablet, tablet_handle))) { LOG_WARN("failed to transform empty shell", K(ret), KPC(tmp_tablet)); } else if (FALSE_IT(new_tablet = tablet_handle.get_obj())) { } else if (OB_FAIL(ObTabletSlogHelper::write_empty_shell_tablet_slog(new_tablet, disk_addr))) { LOG_WARN("fail to write emtpy shell tablet slog", K(ret), K(tablet_id), K(disk_addr)); } else if (FALSE_IT(new_tablet->tablet_addr_ = disk_addr)) { } else if (OB_FAIL(refresh_tablet_addr(ls_id, tablet_id, tablet_handle))) { LOG_WARN("failed to refresh tablet addr", K(ret), K(ls_id), K(tablet_id), K(lbt())); ob_usleep(1000 * 1000); ob_abort(); } else { ls_->get_tablet_gc_handler()->set_tablet_gc_trigger(); LOG_INFO("succeeded to create empty shell tablet", K(ret), K(key), K(param)); } } return ret; } int ObLSTabletService::rollback_tablet( const share::ObLSID &ls_id, const common::ObTabletID &tablet_id) { int ret = OB_SUCCESS; ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); ObLSHandle ls_handle; ObLS *ls = nullptr; ObTabletMapKey key(ls_id, tablet_id); if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("ls tablet service do not init", K(ret)); } else if (OB_UNLIKELY(!ls_id.is_valid() || !tablet_id.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("rollback tablet get invalid argument", K(ret), K(ls_id), K(tablet_id)); } else if (OB_FAIL(do_remove_tablet(key))) { LOG_WARN("failed to delete tablet", K(ret), K(key)); } else if (OB_FAIL(tablet_id_set_.erase(key.tablet_id_))) { if (OB_HASH_NOT_EXIST == ret) { ret = OB_SUCCESS; LOG_DEBUG("tablet id does not exist, maybe has not been inserted yet", K(ret), K(key)); } else { //the caller checks abort if is required. LOG_WARN("failed to erase tablet id", K(ret), K(key)); } } return ret; } int ObLSTabletService::create_memtable( const common::ObTabletID &tablet_id, const int64_t schema_version, const bool for_replay, const share::SCN clog_checkpoint_scn) { int ret = OB_SUCCESS; ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); ObTabletHandle old_tablet_handle; const ObTabletMapKey key(ls_->get_ls_id(), tablet_id); ObTabletHandle new_tablet_handle; ObTabletMemberWrapper table_store; ObTabletMemberWrapper autoinc_seq; ObTimeGuard time_guard("ObLSTabletService::create_memtable", 10_ms); if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!tablet_id.is_valid() || schema_version < 0)) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(tablet_id), K(schema_version)); } else { // we need bucket lock here to protect multi version tablet creation // during tablet creating new memtable and put it into table store. ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); time_guard.click("Lock"); if (OB_FAIL(direct_get_tablet(tablet_id, old_tablet_handle))) { LOG_WARN("fail to get tablet", K(ret), K(tablet_id)); } else if (old_tablet_handle.get_obj()->is_empty_shell()) { LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", old_tablet_handle.get_obj()); } else { time_guard.click("get tablet"); ObTablet &old_tablet = *(old_tablet_handle.get_obj()); if (OB_FAIL(old_tablet.create_memtable(schema_version, clog_checkpoint_scn, for_replay))) { if (OB_MINOR_FREEZE_NOT_ALLOW != ret) { LOG_WARN("fail to create memtable", K(ret), K(new_tablet_handle), K(schema_version), K(tablet_id)); } } else if (FALSE_IT(time_guard.click("create memtable"))) { } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_handle, old_tablet_handle))) { LOG_WARN("fail to compare and swap tablet", K(ret), K(key), K(old_tablet_handle)); } } } return ret; } int ObLSTabletService::check_allow_to_read(AllowToReadMgr::AllowToReadInfo &read_info) { int ret = OB_SUCCESS; allow_to_read_mgr_.load_allow_to_read_info(read_info); if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (!read_info.allow_to_read()) { ret = OB_REPLICA_NOT_READABLE; LOG_WARN("ls is not allow to read", K(ret), KPC(ls_)); } return ret; } int ObLSTabletService::check_read_info_same(const AllowToReadMgr::AllowToReadInfo &read_info) { int ret = OB_SUCCESS; bool is_same = false; allow_to_read_mgr_.check_read_info_same(read_info, is_same); if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (!is_same) { ret = OB_REPLICA_NOT_READABLE; LOG_WARN("ls is not allow to read", K(ret), KPC(ls_)); } return ret; } int ObLSTabletService::get_read_tables( const common::ObTabletID &tablet_id, const int64_t snapshot_version, ObTabletTableIterator &iter, const bool allow_no_ready_read) { int ret = OB_SUCCESS; ObTabletHandle &handle = iter.tablet_handle_; iter.reset(); AllowToReadMgr::AllowToReadInfo read_info; ObTabletMapKey key; key.tablet_id_ = tablet_id; if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!tablet_id.is_valid() || snapshot_version < 0)) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid arguments", K(ret), K(tablet_id), K(snapshot_version)); } else if (FALSE_IT(allow_to_read_mgr_.load_allow_to_read_info(read_info))) { } else if (!read_info.allow_to_read()) { ret = OB_REPLICA_NOT_READABLE; LOG_WARN("ls is not allow to read", K(ret), KPC(ls_)); } else if (FALSE_IT(key.ls_id_ = ls_->get_ls_id())) { } else if (OB_FAIL(ObTabletCreateDeleteHelper::check_and_get_tablet(key, handle, ObTabletCommon::DEFAULT_GET_TABLET_DURATION_US, ObMDSGetTabletMode::READ_READABLE_COMMITED, snapshot_version))) { if (OB_TABLET_NOT_EXIST != ret) { LOG_WARN("fail to check and get tablet", K(ret), K(key), K(snapshot_version)); } } else if (OB_UNLIKELY(!handle.is_valid())) { ret = OB_ERR_UNEXPECTED; LOG_WARN("unexpected error, invalid tablet handle", K(ret), K(handle)); } else if (OB_FAIL(handle.get_obj()->get_read_tables(snapshot_version, iter, allow_no_ready_read))) { LOG_WARN("fail to get read tables", K(ret), K(handle), K(tablet_id), K(snapshot_version), K(iter), K(allow_no_ready_read)); } else { bool is_same = false; allow_to_read_mgr_.check_read_info_same(read_info, is_same); if (!is_same) { ret = OB_REPLICA_NOT_READABLE; LOG_WARN("ls is not allow to read", K(ret), KPC(ls_)); } } return ret; } int ObLSTabletService::set_tablet_status( const common::ObTabletID &tablet_id, const ObTabletCreateDeleteMdsUserData &tablet_status, mds::MdsCtx &ctx) { int ret = OB_SUCCESS; if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!tablet_id.is_valid() || !tablet_status.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid arguments", K(ret), K(tablet_id), K(tablet_status)); } else { ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); ObTabletHandle tablet_handle; if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle))) { if (OB_TABLET_NOT_EXIST == ret) { ret = OB_EAGAIN; LOG_WARN("this tablet has been deleted, skip it", K(ret), K(tablet_id)); } else { LOG_WARN("fail to get tablet", K(ret)); } } else if (OB_FAIL(tablet_handle.get_obj()->set_tablet_status(tablet_status, ctx))) { LOG_WARN("fail to set tablet status", K(ret), K(tablet_id), K(tablet_status)); } else { LOG_INFO("succeeded to set tablet status", K(ret), K(tablet_id), K(tablet_status)); } } return ret; } int ObLSTabletService::replay_set_tablet_status( const common::ObTabletID &tablet_id, const share::SCN &scn, const ObTabletCreateDeleteMdsUserData &tablet_status, mds::MdsCtx &ctx) { int ret = OB_SUCCESS; if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!tablet_id.is_valid() || !tablet_status.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid arguments", K(ret), K(tablet_id), K(tablet_status)); } else { ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); ObTabletHandle tablet_handle; if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle))) { if (OB_TABLET_NOT_EXIST == ret) { ret = OB_EAGAIN; LOG_WARN("this tablet has been deleted, skip it", K(ret), K(tablet_id)); } else { LOG_WARN("fail to get tablet", K(ret)); } } else if (OB_FAIL(tablet_handle.get_obj()->replay_set_tablet_status(scn, tablet_status, ctx))) { LOG_WARN("fail to replay set tablet status", K(ret), K(tablet_id), K(scn), K(tablet_status)); } else { LOG_INFO("succeeded to replay set tablet status", K(ret), K(tablet_id), K(scn), K(tablet_status)); } } return ret; } int ObLSTabletService::set_ddl_info( const common::ObTabletID &tablet_id, const ObTabletBindingMdsUserData &ddl_data, mds::MdsCtx &ctx, const int64_t timeout_us) { int ret = OB_SUCCESS; if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!tablet_id.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid arguments", K(ret), K(tablet_id), K(ddl_data)); } else { ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); ObTabletHandle tablet_handle; if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle))) { if (OB_TABLET_NOT_EXIST == ret) { ret = OB_EAGAIN; LOG_WARN("this tablet has been deleted, skip it", K(ret), K(tablet_id)); } else { LOG_WARN("fail to get tablet", K(ret)); } } else if (OB_FAIL(tablet_handle.get_obj()->set_ddl_info(ddl_data, ctx, timeout_us))) { LOG_WARN("fail to set ddl info", K(ret), K(tablet_id), K(ddl_data), K(timeout_us)); } else { LOG_INFO("succeeded to set ddl info", K(ret), K(tablet_id), K(ddl_data), K(timeout_us)); } } return ret; } int ObLSTabletService::replay_set_ddl_info( const common::ObTabletID &tablet_id, const share::SCN &scn, const ObTabletBindingMdsUserData &ddl_data, mds::MdsCtx &ctx) { int ret = OB_SUCCESS; if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!tablet_id.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid arguments", K(ret), K(tablet_id), K(ddl_data)); } else { ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); ObTabletHandle tablet_handle; if (OB_FAIL(direct_get_tablet(tablet_id, tablet_handle))) { if (OB_TABLET_NOT_EXIST == ret) { ret = OB_EAGAIN; LOG_WARN("this tablet has been deleted, skip it", K(ret), K(tablet_id)); } else { LOG_WARN("fail to get tablet", K(ret)); } } else if (OB_FAIL(tablet_handle.get_obj()->replay_set_ddl_info(scn, ddl_data, ctx))) { LOG_WARN("fail to set ddl info", K(ret), K(tablet_id), K(ddl_data), K(scn)); } else { LOG_INFO("succeeded to set ddl info", K(ret), K(tablet_id), K(ddl_data), K(scn)); } } return ret; } int ObLSTabletService::build_create_sstable_param_for_migration( const blocksstable::ObMigrationSSTableParam &mig_param, ObTabletCreateSSTableParam ¶m) { int ret = OB_SUCCESS; if (OB_UNLIKELY(!mig_param.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid argument", K(ret), K(mig_param)); } else { param.table_key_ = mig_param.table_key_; param.schema_version_ = mig_param.basic_meta_.schema_version_; param.create_snapshot_version_ = mig_param.basic_meta_.create_snapshot_version_; param.progressive_merge_round_ = mig_param.basic_meta_.progressive_merge_round_; param.progressive_merge_step_ = mig_param.basic_meta_.progressive_merge_step_; param.is_ready_for_read_ = false; param.table_mode_ = mig_param.basic_meta_.table_mode_; param.index_type_ = static_cast(mig_param.basic_meta_.index_type_); param.rowkey_column_cnt_ = mig_param.basic_meta_.rowkey_column_count_; param.root_row_store_type_ = mig_param.basic_meta_.root_row_store_type_; param.latest_row_store_type_ = mig_param.basic_meta_.latest_row_store_type_; param.index_blocks_cnt_ = mig_param.basic_meta_.index_macro_block_count_; param.data_blocks_cnt_ = mig_param.basic_meta_.data_macro_block_count_; param.micro_block_cnt_ = mig_param.basic_meta_.data_micro_block_count_; param.use_old_macro_block_count_ = mig_param.basic_meta_.use_old_macro_block_count_; param.row_count_ = mig_param.basic_meta_.row_count_; param.column_cnt_ = mig_param.basic_meta_.column_cnt_; param.data_checksum_ = mig_param.basic_meta_.data_checksum_; param.occupy_size_ = mig_param.basic_meta_.occupy_size_; param.original_size_ = mig_param.basic_meta_.original_size_; param.max_merged_trans_version_ = mig_param.basic_meta_.max_merged_trans_version_; param.ddl_scn_ = mig_param.basic_meta_.ddl_scn_; param.filled_tx_scn_ = mig_param.basic_meta_.filled_tx_scn_; param.contain_uncommitted_row_ = mig_param.basic_meta_.contain_uncommitted_row_; param.compressor_type_ = mig_param.basic_meta_.compressor_type_; param.encrypt_id_ = mig_param.basic_meta_.encrypt_id_; param.master_key_id_ = mig_param.basic_meta_.master_key_id_; MEMCPY(param.encrypt_key_, mig_param.basic_meta_.encrypt_key_, share::OB_MAX_TABLESPACE_ENCRYPT_KEY_LENGTH); param.root_block_addr_.set_none_addr(); param.data_block_macro_meta_addr_.set_none_addr();; if (OB_FAIL(param.column_checksums_.assign(mig_param.column_checksums_))) { LOG_WARN("fail to assign column checksums", K(ret), K(mig_param)); } } return ret; } int ObLSTabletService::insert_rows( ObTabletHandle &tablet_handle, ObStoreCtx &ctx, const ObDMLBaseParam &dml_param, const common::ObIArray &column_ids, common::ObNewRowIterator *row_iter, int64_t &affected_rows) { int ret = OB_SUCCESS; NG_TRACE(S_insert_rows_begin); int64_t afct_num = 0; int64_t dup_num = 0; if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!ctx.is_valid()) || !ctx.is_write() || OB_UNLIKELY(!dml_param.is_valid()) || OB_UNLIKELY(column_ids.count() <= 0) || OB_ISNULL(row_iter)) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(ctx), K(dml_param), K(column_ids), KP(row_iter)); } else if (dml_param.is_direct_insert()) { // direct-insert mode const ObTableSchemaParam::Columns &columns = dml_param.table_param_->get_data_table().get_columns(); bool is_heap_table = columns.at(0)->is_hidden(); if (OB_FAIL(direct_insert_rows(dml_param.table_param_->get_data_table().get_table_id(), dml_param.direct_insert_task_id_, ctx.tablet_id_, is_heap_table, row_iter, afct_num))) { LOG_WARN("failed to insert rows direct", KR(ret), K(dml_param.table_param_->get_data_table().get_table_id()), K(dml_param.direct_insert_task_id_), K(ctx.tablet_id_), K(is_heap_table)); } } else { ObArenaAllocator lob_allocator(ObModIds::OB_LOB_ACCESS_BUFFER, OB_MALLOC_NORMAL_BLOCK_SIZE, MTL_ID()); ObDMLRunningCtx run_ctx(ctx, dml_param, ctx.mvcc_acc_ctx_.mem_ctx_->get_query_allocator(), lob_allocator, ObDmlFlag::DF_INSERT); ObIAllocator &work_allocator = run_ctx.allocator_; void *ptr = nullptr; ObStoreRow *tbl_rows = nullptr; int64_t row_count = 0; bool first_bulk = true; ObNewRow *rows = nullptr; if (OB_FAIL(prepare_dml_running_ctx(&column_ids, nullptr, tablet_handle, run_ctx))) { LOG_WARN("failed to prepare dml running ctx", K(ret)); } else { ObTabletHandle tmp_handle; SMART_VAR(ObRowsInfo, rows_info) { const ObRelativeTable &data_table = run_ctx.relative_table_; while (OB_SUCC(ret) && OB_SUCC(get_next_rows(row_iter, rows, row_count))) { ObStoreRow reserved_row; // Let ObStorageTableGuard refresh retired memtable, should not hold origin tablet handle // outside the while loop. if (tmp_handle.get_obj() != run_ctx.relative_table_.tablet_iter_.get_tablet_handle().get_obj()) { tmp_handle = run_ctx.relative_table_.tablet_iter_.get_tablet_handle(); rows_info.reset(); if (OB_FAIL(rows_info.init(data_table, ctx, tmp_handle.get_obj()->get_rowkey_read_info()))) { LOG_WARN("Failed to init rows info", K(ret), K(data_table)); } } if (OB_FAIL(ret)) { } else if (row_count <= 0) { ret = OB_ERR_UNEXPECTED; LOG_WARN("row_count should be greater than 0", K(ret)); } else if (1 == row_count) { tbl_rows = &reserved_row; tbl_rows[0].flag_.set_flag(ObDmlFlag::DF_INSERT); } else if (first_bulk) { first_bulk = false; if (OB_ISNULL(ptr = work_allocator.alloc(row_count * sizeof(ObStoreRow)))) { ret = OB_ALLOCATE_MEMORY_FAILED; LOG_ERROR("fail to allocate memory", K(ret), K(row_count)); } else { tbl_rows = new (ptr) ObStoreRow[row_count]; for (int64_t i = 0; i < row_count; i++) { tbl_rows[i].flag_.set_flag(ObDmlFlag::DF_INSERT); } } } if (OB_FAIL(ret)) { } else if (OB_ISNULL(tbl_rows)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("unexpected error, tbl_rows is NULL", K(ret), KP(tbl_rows)); } else if (OB_FAIL(insert_rows_to_tablet(tablet_handle, run_ctx, rows, row_count, rows_info, tbl_rows, afct_num, dup_num))) { LOG_WARN("insert to each tablets fail", K(ret)); } } } else { LOG_WARN("Failed to allocate ObRowsInfo", K(ret)); } lob_allocator.reuse(); } if (OB_ITER_END == ret) { ret = OB_SUCCESS; } if (nullptr != ptr) { work_allocator.free(ptr); } lob_allocator.reset(); } if (OB_SUCC(ret)) { LOG_DEBUG("succeeded to insert rows", K(ret)); affected_rows = afct_num; EVENT_ADD(STORAGE_INSERT_ROW_COUNT, afct_num); } NG_TRACE(S_insert_rows_end); return ret; } int ObLSTabletService::direct_insert_rows( const uint64_t table_id, const int64_t task_id, const ObTabletID &tablet_id, const bool is_heap_table, ObNewRowIterator *row_iter, int64_t &affected_rows) { int ret = OB_SUCCESS; ObTableLoadTableCtx *table_ctx = nullptr; ObTableLoadKey key(MTL_ID(), table_id); if (OB_FAIL(ObTableLoadService::get_ctx(key, table_ctx))) { LOG_WARN("fail to get table ctx", KR(ret), K(key)); } else { int64_t row_count = 0; ObNewRow *rows = nullptr; table::ObTableLoadTransId trans_id; trans_id.segment_id_ = task_id; trans_id.trans_gid_ = 1; ObTableLoadStore store(table_ctx); if (OB_FAIL(store.init())) { LOG_WARN("fail to init store", KR(ret)); } while (OB_SUCC(ret) && OB_SUCC(get_next_rows(row_iter, rows, row_count))) { if (row_count <= 0) { ret = OB_ERR_UNEXPECTED; LOG_WARN("row_count should be greater than 0", K(ret)); } else { common::ObArray row_array; for (int64_t i = 0; OB_SUCC(ret) && (i < row_count); ++i) { ObNewRow new_row; if (is_heap_table) { new_row.assign(rows[i].cells_ + 1, rows[i].count_ - 1); } else { new_row.assign(rows[i].cells_, rows[i].count_); } if (OB_FAIL(row_array.push_back(new_row))) { LOG_WARN("failed to push back row to row_array", KR(ret), K(i), K(new_row)); } } if (OB_SUCC(ret)) { if (OB_FAIL(store.px_write(trans_id, tablet_id, row_array))) { LOG_WARN("failed to write to store", KR(ret), K(trans_id), K(table_id), K(tablet_id), K(row_array)); } else { affected_rows += row_count; } } } } if (OB_ITER_END == ret) { ret = OB_SUCCESS; } } if (OB_NOT_NULL(table_ctx)) { ObTableLoadService::put_ctx(table_ctx); table_ctx = nullptr; } return ret; } int ObLSTabletService::insert_row( ObTabletHandle &tablet_handle, ObStoreCtx &ctx, const ObDMLBaseParam &dml_param, const common::ObIArray &column_ids, const common::ObIArray &duplicated_column_ids, const common::ObNewRow &row, const ObInsertFlag flag, int64_t &affected_rows, common::ObNewRowIterator *&duplicated_rows) { int ret = OB_SUCCESS; const ObTabletID &data_tablet_id = ctx.tablet_id_; if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!ctx.is_valid() || !ctx.is_write() || !dml_param.is_valid() || column_ids.count() <= 0 || duplicated_column_ids.count() <= 0 || !row.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(ctx), K(dml_param), K(column_ids), K(duplicated_column_ids), K(row), K(flag)); } else { ObArenaAllocator lob_allocator(ObModIds::OB_LOB_ACCESS_BUFFER, OB_MALLOC_NORMAL_BLOCK_SIZE, MTL_ID()); ObDMLRunningCtx run_ctx(ctx, dml_param, ctx.mvcc_acc_ctx_.mem_ctx_->get_query_allocator(), lob_allocator, ObDmlFlag::DF_INSERT); ObIAllocator &work_allocator = run_ctx.allocator_; duplicated_rows = nullptr; ObStoreRow &tbl_row = run_ctx.tbl_row_; const ObRelativeTable &data_table = run_ctx.relative_table_; if (OB_FAIL(prepare_dml_running_ctx(&column_ids, nullptr, tablet_handle, run_ctx))) { LOG_WARN("failed to prepare dml running ctx", K(ret)); } else { tbl_row.flag_.set_flag(ObDmlFlag::DF_INSERT); tbl_row.row_val_ = row; if (OB_FAIL(get_conflict_rows(tablet_handle, run_ctx, flag, duplicated_column_ids, tbl_row.row_val_, duplicated_rows))) { LOG_WARN("failed to get conflict row(s)", K(ret), K(duplicated_column_ids), K(row)); } else if (nullptr == duplicated_rows) { if (OB_FAIL(insert_row_to_tablet(tablet_handle, run_ctx, tbl_row))) { if (OB_TRY_LOCK_ROW_CONFLICT != ret) { LOG_WARN("failed to write row", K(ret)); } } else { LOG_DEBUG("succeeded to insert row", K(ret), K(row)); affected_rows = 1; EVENT_INC(STORAGE_INSERT_ROW_COUNT); } } else { ret = OB_ERR_PRIMARY_KEY_DUPLICATE; } } lob_allocator.reset(); } return ret; } static inline bool is_lob_update(ObDMLRunningCtx &run_ctx, const ObIArray &update_idx) { bool bool_ret = false; for (int64_t i = 0; i < update_idx.count() && !bool_ret; ++i) { int64_t idx = update_idx.at(i); if (run_ctx.col_descs_->at(idx).col_type_.is_lob_storage()) { bool_ret = true; } } return bool_ret; } int ObLSTabletService::update_rows( ObTabletHandle &tablet_handle, ObStoreCtx &ctx, const ObDMLBaseParam &dml_param, const ObIArray &column_ids, const ObIArray< uint64_t> &updated_column_ids, ObNewRowIterator *row_iter, int64_t &affected_rows) { int ret = OB_SUCCESS; NG_TRACE(S_update_rows_begin); const ObTabletID &data_tablet_id = ctx.tablet_id_; int64_t afct_num = 0; int64_t dup_num = 0; int64_t got_row_count = 0; ObTimeGuard timeguard(__func__, 3 * 1000 * 1000); if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!ctx.is_valid() || !ctx.is_write() || !dml_param.is_valid() || column_ids.count() <= 0 || updated_column_ids.count() <= 0 || nullptr == row_iter)) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(ctx), K(dml_param), K(column_ids), K(updated_column_ids), KP(row_iter)); } else { timeguard.click("Get"); ObArenaAllocator lob_allocator(ObModIds::OB_LOB_ACCESS_BUFFER, OB_MALLOC_NORMAL_BLOCK_SIZE, MTL_ID()); ObDMLRunningCtx run_ctx(ctx, dml_param, ctx.mvcc_acc_ctx_.mem_ctx_->get_query_allocator(), lob_allocator, ObDmlFlag::DF_UPDATE); ObIAllocator &work_allocator = run_ctx.allocator_; ObStoreRow old_tbl_row; void *old_row_cells = nullptr; ObStoreRow &new_tbl_row = run_ctx.tbl_row_; bool rowkey_change = false; UpdateIndexArray update_idx; ObRowStore row_store; bool delay_new = false; bool lob_update = false; const ObRelativeTable &relative_table = run_ctx.relative_table_; if (OB_FAIL(prepare_dml_running_ctx(&column_ids, &updated_column_ids, tablet_handle, run_ctx))) { LOG_WARN("failed to prepare dml running ctx", K(ret)); } else if (FALSE_IT(tablet_handle.reset())) { } else if (FALSE_IT(timeguard.click("Prepare"))) { } else if (OB_UNLIKELY(!relative_table.is_valid())) { ret = OB_ERR_SYS; LOG_ERROR("data table is not prepared", K(ret)); } else if (OB_FAIL(construct_update_idx(relative_table.get_rowkey_column_num(), run_ctx.col_map_, updated_column_ids, update_idx))) { LOG_WARN("failed to construct update_idx", K(ret), K(updated_column_ids)); } else if (FALSE_IT(timeguard.click("Construct"))) { } else if (OB_FAIL(check_rowkey_change(updated_column_ids, relative_table, rowkey_change, delay_new))) { LOG_WARN("failed to check rowkey changes", K(ret)); } else { timeguard.click("Check"); const int64_t num = relative_table.get_column_count(); if (OB_ISNULL(old_row_cells = work_allocator.alloc( static_cast(sizeof(common::ObObj) * num)))) { ret = OB_ALLOCATE_MEMORY_FAILED; LOG_ERROR("failed to malloc temp row cells", K(ret)); } else { timeguard.click("AllocOld"); old_tbl_row.row_val_.cells_ = new (old_row_cells) ObObj[num](); old_tbl_row.flag_.set_flag(ObDmlFlag::DF_UPDATE); new_tbl_row.flag_.set_flag(ObDmlFlag::DF_UPDATE); } lob_update = is_lob_update(run_ctx, update_idx); } int64_t cur_time = 0; ObTabletHandle tmp_handle; while (OB_SUCC(ret) && OB_SUCC(get_next_row_from_iter(row_iter, old_tbl_row, true)) && OB_SUCC(get_next_row_from_iter(row_iter, new_tbl_row, false))) { LOG_DEBUG("get_dml_update_row", KP(row_iter), K(old_tbl_row), K(new_tbl_row)); // Let ObStorageTableGuard refresh retired memtable, should not hold origin tablet handle // outside the while loop. if (tmp_handle.get_obj() != run_ctx.relative_table_.tablet_iter_.get_tablet_handle().get_obj()) { tmp_handle = run_ctx.relative_table_.tablet_iter_.get_tablet_handle(); } bool duplicate = false; ++got_row_count; cur_time = ObClockGenerator::getClock(); if ((0 == (0x1FF & got_row_count)) && (cur_time > dml_param.timeout_)) { //checking timeout cost too much, so check every 512 rows ret = OB_TIMEOUT; LOG_WARN("query timeout", K(cur_time), K(dml_param), K(ret)); } else if (OB_FAIL(update_row_to_tablet(tmp_handle, run_ctx, rowkey_change, update_idx, delay_new, lob_update, old_tbl_row, new_tbl_row, &row_store, duplicate))) { LOG_WARN("failed to update row to tablets", K(ret), K(old_tbl_row), K(new_tbl_row)); } else if (duplicate) { dup_num++; } else { afct_num++; } lob_allocator.reuse(); timeguard.click("Update"); } if (OB_ITER_END == ret) { ret = OB_SUCCESS; } if (OB_SUCC(ret) && row_store.get_row_count() > 0) { void *ptr1 = nullptr; const int64_t num = relative_table.get_column_count(); if (OB_ISNULL(ptr1 = work_allocator.alloc(sizeof(common::ObObj) * num))) { ret = OB_ALLOCATE_MEMORY_FAILED; LOG_ERROR("failed to malloc temp row cells", K(ret)); } else { timeguard.click("AllocNew"); new_tbl_row.row_val_.cells_ = new(ptr1) ObObj[num](); ObRowStore::Iterator row_iter2 = row_store.begin(); ObTabletHandle tmp_handle; // when total_quantity_log is true, we should iterate new_tbl_row and old_tbl_row, and // dispose these two rows together, otherwise, when total_quantity_log is false, // row_iter2 doesn't contain old rows, and old_tbl_row is a dummy param in process_new_row while (OB_SUCC(ret) && OB_SUCC(row_iter2.get_next_row(new_tbl_row.row_val_))) { // Let ObStorageTableGuard refresh retired memtable, should not hold origin tablet handle // outside the while loop. if (tmp_handle.get_obj() != run_ctx.relative_table_.tablet_iter_.get_tablet_handle().get_obj()) { tmp_handle = run_ctx.relative_table_.tablet_iter_.get_tablet_handle(); } int64_t data_tbl_rowkey_len = relative_table.get_rowkey_column_num(); bool tbl_rowkey_change = false; if (OB_FAIL(row_iter2.get_next_row(old_tbl_row.row_val_))) { LOG_WARN("fail to get row from row stores", K(ret)); } else if (FALSE_IT(timeguard.click("GetNext"))) { } else if (rowkey_change && OB_FAIL(check_rowkey_value_change(old_tbl_row.row_val_, new_tbl_row.row_val_, data_tbl_rowkey_len, tbl_rowkey_change))) { LOG_WARN("check data table rowkey change failed", K(ret), K(old_tbl_row), K(new_tbl_row), K(data_tbl_rowkey_len)); } else if (OB_FAIL(process_new_row(tmp_handle, run_ctx, update_idx, old_tbl_row, new_tbl_row, tbl_rowkey_change))) { LOG_WARN("fail to process new row", K(ret), K(old_tbl_row), K(new_tbl_row)); } timeguard.click("Process"); } work_allocator.free(ptr1); ptr1 = nullptr; new_tbl_row.row_val_.cells_ = nullptr; } } if (OB_ITER_END == ret) { ret = OB_SUCCESS; } if (nullptr != old_row_cells) { work_allocator.free(old_row_cells); } lob_allocator.reset(); old_tbl_row.row_val_.cells_ = nullptr; if (OB_SUCC(ret)) { affected_rows = afct_num; EVENT_ADD(STORAGE_UPDATE_ROW_COUNT, afct_num); } if (timeguard.get_diff() > 3 * 1000 * 1000) { LOG_WARN_RET(OB_ERR_TOO_MUCH_TIME, "update rows use too much time", K(afct_num), K(got_row_count)); } } NG_TRACE(S_update_rows_end); return ret; } int ObLSTabletService::put_rows( ObTabletHandle &tablet_handle, ObStoreCtx &ctx, const ObDMLBaseParam &dml_param, const ObIArray &column_ids, ObNewRowIterator *row_iter, int64_t &affected_rows) { int ret = OB_SUCCESS; const ObTabletID &data_tablet_id = ctx.tablet_id_; int64_t afct_num = 0; ObTimeGuard timeguard(__func__, 3 * 1000 * 1000); if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!ctx.is_valid()) || OB_UNLIKELY(!ctx.is_write()) || OB_UNLIKELY(!dml_param.is_valid()) || OB_UNLIKELY(column_ids.count() <= 0) || OB_ISNULL(row_iter)) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(ctx), K(dml_param), K(column_ids), KP(row_iter)); } else { ObArenaAllocator lob_allocator(ObModIds::OB_LOB_ACCESS_BUFFER, OB_MALLOC_NORMAL_BLOCK_SIZE, MTL_ID()); ObDMLRunningCtx run_ctx(ctx, dml_param, ctx.mvcc_acc_ctx_.mem_ctx_->get_query_allocator(), lob_allocator, ObDmlFlag::DF_UPDATE); ObIAllocator &work_allocator = run_ctx.allocator_; ObNewRow *row = nullptr; ObStoreRow &tbl_row = run_ctx.tbl_row_; const ObRelativeTable &data_table = run_ctx.relative_table_; if (OB_FAIL(prepare_dml_running_ctx(&column_ids, nullptr, tablet_handle, run_ctx))) { LOG_WARN("failed to prepare dml running ctx", K(ret)); } else { tablet_handle.reset(); tbl_row.flag_.set_flag(ObDmlFlag::DF_UPDATE); } int64_t cur_time = 0; ObTabletHandle tmp_handle; while (OB_SUCC(ret) && OB_SUCC(row_iter->get_next_row(row))) { // Let ObStorageTableGuard refresh retired memtable, should not hold origin tablet handle // outside the while loop. if (tmp_handle.get_obj() != run_ctx.relative_table_.tablet_iter_.get_tablet_handle().get_obj()) { tmp_handle = run_ctx.relative_table_.tablet_iter_.get_tablet_handle(); } cur_time = ObClockGenerator::getClock(); tbl_row.row_val_ = *row; if (cur_time > dml_param.timeout_) { ret = OB_TIMEOUT; LOG_WARN("query timeout", K(ret), K(cur_time), K(dml_param)); } else if (OB_FAIL(insert_row_to_tablet(tmp_handle, run_ctx, tbl_row))) { if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) { LOG_WARN("failed to write row", K(ret)); } } ++afct_num; lob_allocator.reuse(); } if (OB_ITER_END == ret) { ret = OB_SUCCESS; } lob_allocator.reset(); if (OB_SUCC(ret)) { affected_rows = afct_num; EVENT_ADD(STORAGE_INSERT_ROW_COUNT, afct_num); } } return ret; } int ObLSTabletService::delete_rows( ObTabletHandle &tablet_handle, ObStoreCtx &ctx, const ObDMLBaseParam &dml_param, const ObIArray &column_ids, ObNewRowIterator *row_iter, int64_t &affected_rows) { int ret = OB_SUCCESS; NG_TRACE(S_delete_rows_begin); const ObTabletID &data_tablet_id = ctx.tablet_id_; ObRowReshape *row_reshape = nullptr; int64_t afct_num = 0; ObTimeGuard timeguard(__func__, 3 * 1000 * 1000); if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_ISNULL(row_iter) || !ctx.is_valid() || !ctx.is_write() || column_ids.count() <= 0 || OB_ISNULL(row_iter)) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(dml_param), K(column_ids), KP(row_iter), K(ctx)); } else { ObArenaAllocator lob_allocator(ObModIds::OB_LOB_ACCESS_BUFFER, OB_MALLOC_NORMAL_BLOCK_SIZE, MTL_ID()); ObDMLRunningCtx run_ctx(ctx, dml_param, ctx.mvcc_acc_ctx_.mem_ctx_->get_query_allocator(), lob_allocator, ObDmlFlag::DF_DELETE); ObNewRow *row = nullptr; if (OB_FAIL(prepare_dml_running_ctx(&column_ids, nullptr, tablet_handle, run_ctx))) { LOG_WARN("failed to prepare dml running ctx", K(ret)); } else { tablet_handle.reset(); } // delete table rows int64_t cur_time = 0; ObTabletHandle tmp_handle; while (OB_SUCC(ret) && OB_SUCC(row_iter->get_next_row(row))) { // Let ObStorageTableGuard refresh retired memtable, should not hold origin tablet handle // outside the while loop. if (tmp_handle.get_obj() != run_ctx.relative_table_.tablet_iter_.get_tablet_handle().get_obj()) { tmp_handle = run_ctx.relative_table_.tablet_iter_.get_tablet_handle(); } cur_time = ObClockGenerator::getClock(); if (cur_time > run_ctx.dml_param_.timeout_) { ret = OB_TIMEOUT; LOG_WARN("query timeout", K(cur_time), K(run_ctx.dml_param_), K(ret)); } else if (OB_ISNULL(row)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("get next row from iterator failed", KP(row), K(ret)); } else if (OB_FAIL(delete_row_in_tablet(tmp_handle, run_ctx, *row))) { LOG_WARN("fail to delete row", K(ret), K(row)); } else { ++afct_num; } lob_allocator.reuse(); } lob_allocator.reset(); if (OB_ITER_END == ret) { ret = OB_SUCCESS; } if (OB_SUCC(ret)) { affected_rows = afct_num; EVENT_ADD(STORAGE_DELETE_ROW_COUNT, afct_num); } } NG_TRACE(S_delete_rows_end); return ret; } int ObLSTabletService::lock_rows( ObTabletHandle &tablet_handle, ObStoreCtx &ctx, const ObDMLBaseParam &dml_param, const int64_t abs_lock_timeout, const ObLockFlag lock_flag, const bool is_sfu, ObNewRowIterator *row_iter, int64_t &affected_rows) { UNUSEDx(lock_flag, is_sfu); NG_TRACE(S_lock_rows_begin); int ret = OB_SUCCESS; const ObTabletID &data_tablet_id = ctx.tablet_id_; ObTimeGuard timeguard(__func__, 3 * 1000 * 1000); int64_t afct_num = 0; ObColDescArray col_desc; common::ObSEArray column_ids; if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("tablet service is not initialized", K(ret)); } else if (OB_UNLIKELY(!ctx.is_valid() || !ctx.is_write() || !dml_param.is_valid() || OB_ISNULL(row_iter))) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid argument", K(ret), K(ctx), K(dml_param), KPC(row_iter)); } else { timeguard.click("Get"); ObDMLRunningCtx run_ctx(ctx, dml_param, ctx.mvcc_acc_ctx_.mem_ctx_->get_query_allocator(), ctx.mvcc_acc_ctx_.mem_ctx_->get_query_allocator(), ObDmlFlag::DF_LOCK); ObNewRow *row = nullptr; if (OB_FAIL(prepare_dml_running_ctx(nullptr, nullptr, tablet_handle, run_ctx))) { LOG_WARN("failed to prepare dml running ctx", K(ret)); } else if (FALSE_IT(tablet_handle.reset())) { } else if (FALSE_IT(timeguard.click("Prepare"))) { } else if (OB_FAIL(run_ctx.relative_table_.get_rowkey_column_ids(col_desc))) { LOG_WARN("Fail to get column desc", K(ret)); } else if (OB_FAIL(run_ctx.relative_table_.get_rowkey_column_ids(column_ids))) { LOG_WARN("Fail to get column ids", K(ret)); } else { timeguard.click("GetIds"); run_ctx.column_ids_ = &column_ids; ctx.mvcc_acc_ctx_.abs_lock_timeout_ = ObTablet::get_lock_wait_timeout(abs_lock_timeout, dml_param.timeout_); ObTabletHandle tmp_handle; while (OB_SUCCESS == ret && OB_SUCC(row_iter->get_next_row(row))) { // Let ObStorageTableGuard refresh retired memtable, should not hold origin tablet handle // outside the while loop. if (tmp_handle.get_obj() != run_ctx.relative_table_.tablet_iter_.get_tablet_handle().get_obj()) { tmp_handle = run_ctx.relative_table_.tablet_iter_.get_tablet_handle(); } ObRelativeTable &relative_table = run_ctx.relative_table_; bool is_exists = true; if (ObTimeUtility::current_time() > dml_param.timeout_) { ret = OB_TIMEOUT; int64_t cur_time = ObClockGenerator::getClock(); LOG_WARN("query timeout", K(cur_time), K(dml_param), K(ret)); } else if (GCONF.enable_defensive_check() && OB_FAIL(check_old_row_legitimacy(tmp_handle, run_ctx, *row))) { LOG_WARN("check row legitimacy failed", K(ret), KPC(row)); } else if (GCONF.enable_defensive_check() && OB_FAIL(check_new_row_nullable_value(col_desc, relative_table, *row))) { LOG_WARN("check lock row nullable failed", K(ret)); } else if (FALSE_IT(timeguard.click("Check"))) { } else if (OB_FAIL(tmp_handle.get_obj()->lock_row(run_ctx.relative_table_, ctx, *row))) { if (OB_TRY_LOCK_ROW_CONFLICT != ret) { LOG_WARN("failed to lock row", K(*row), K(ret)); } } else { ++afct_num; } timeguard.click("Lock"); } if (OB_ITER_END == ret) { ret = OB_SUCCESS; affected_rows = afct_num; } } } NG_TRACE(S_lock_rows_end); return ret; } int ObLSTabletService::lock_row( ObTabletHandle &tablet_handle, ObStoreCtx &ctx, const ObDMLBaseParam &dml_param, const int64_t abs_lock_timeout, const ObNewRow &row, const ObLockFlag lock_flag, const bool is_sfu) { UNUSEDx(lock_flag, is_sfu); int ret = OB_SUCCESS; const ObTabletID &data_tablet_id = ctx.tablet_id_; ObTimeGuard timeguard(__func__, 3 * 1000 * 1000); int64_t afct_num = 0; ObColDescArray col_desc; if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("tablet service is not initialized", K(ret)); } else if (OB_UNLIKELY(!ctx.is_valid() || !dml_param.is_valid() || !row.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid argument", K(ret), K(ctx), K(dml_param), K(row)); } else { ObDMLRunningCtx run_ctx(ctx, dml_param, ctx.mvcc_acc_ctx_.mem_ctx_->get_query_allocator(), ctx.mvcc_acc_ctx_.mem_ctx_->get_query_allocator(), ObDmlFlag::DF_LOCK); if (OB_FAIL(prepare_dml_running_ctx(nullptr, nullptr, tablet_handle, run_ctx))) { LOG_WARN("failed to prepare dml running ctx", K(ret)); } else if (OB_FAIL(run_ctx.relative_table_.get_rowkey_column_ids(col_desc))) { LOG_WARN("Fail to get column desc", K(ret)); } else { ctx.mvcc_acc_ctx_.abs_lock_timeout_ = ObTablet::get_lock_wait_timeout(abs_lock_timeout, dml_param.timeout_); if (ObTimeUtility::current_time() > dml_param.timeout_) { ret = OB_TIMEOUT; int64_t cur_time = ObClockGenerator::getClock(); LOG_WARN("query timeout", K(cur_time), K(dml_param), K(ret)); } else if (OB_FAIL(tablet_handle.get_obj()->lock_row(run_ctx.relative_table_, ctx, row))) { if (OB_TRY_LOCK_ROW_CONFLICT != ret) { LOG_WARN("failed to lock row", K(row), K(ret)); } } else { ++afct_num; } } } return ret; } int ObLSTabletService::trim_rebuild_tablet( const ObTabletID &tablet_id, const bool is_rollback) { int ret = OB_SUCCESS; if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(is_stopped_)) { ret = OB_NOT_RUNNING; LOG_WARN("tablet service stopped", K(ret)); } else if (OB_UNLIKELY(!tablet_id.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid argument", K(ret), K(tablet_id)); } else if (is_rollback && OB_FAIL(rollback_rebuild_tablet(tablet_id))) { LOG_WARN("failed to rollback tablet rebuilt", K(ret), K(is_rollback), K(tablet_id)); } else if (!is_rollback && OB_FAIL(trim_old_tablets(tablet_id))) { LOG_WARN("failed to trim old tablets", K(ret), K(is_rollback), K(tablet_id)); } return ret; } int ObLSTabletService::create_or_update_migration_tablet( const ObMigrationTabletParam &mig_tablet_param, const bool is_transfer) { // TODO: is_transfer may be redundant, temporarily unused UNUSEDx(is_transfer); int ret = OB_SUCCESS; const share::ObLSID &ls_id = mig_tablet_param.ls_id_; const common::ObTabletID &tablet_id = mig_tablet_param.tablet_id_; ObTabletHandle tablet_handle; bool b_exist = false; const bool need_create_msd_tablet = mig_tablet_param.is_empty_shell(); if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(is_stopped_)) { ret = OB_NOT_RUNNING; LOG_WARN("tablet service stopped", K(ret)); } else if (!mig_tablet_param.is_empty_shell() && (OB_UNLIKELY(!mig_tablet_param.is_valid()) || OB_UNLIKELY(ls_id != ls_->get_ls_id()))) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(mig_tablet_param), K_(ls)); } else if (need_create_msd_tablet) { if (OB_FAIL(create_empty_shell_tablet(mig_tablet_param, tablet_handle))) { LOG_WARN("failed to create empty shell tablet", K(ret), K(tablet_id), K(mig_tablet_param)); } } else { ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); if (OB_FAIL(has_tablet(ls_id, tablet_id, b_exist))) { LOG_WARN("failed to check tablet existence", K(ls_id), K(tablet_id)); } else if (b_exist && OB_FAIL(migrate_update_tablet(mig_tablet_param))) { LOG_WARN("failed to update tablet meta", K(ret), K(tablet_id), K(mig_tablet_param)); } else if (!b_exist && OB_FAIL(migrate_create_tablet(mig_tablet_param, tablet_handle))) { LOG_WARN("failed to migrate create tablet", K(ret), K(mig_tablet_param)); } } return ret; } int ObLSTabletService::rebuild_create_tablet( const ObMigrationTabletParam &mig_tablet_param, const bool keep_old) { int ret = OB_SUCCESS; const share::ObLSID &ls_id = mig_tablet_param.ls_id_; const common::ObTabletID &tablet_id = mig_tablet_param.tablet_id_; const ObTabletMapKey key(ls_id, tablet_id); bool b_exist = false; const bool need_create_msd_tablet = mig_tablet_param.is_empty_shell() && !keep_old; ObTabletHandle new_tablet_handle; ObTabletHandle old_tablet_handle; if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(is_stopped_)) { ret = OB_NOT_RUNNING; LOG_WARN("tablet service stopped", K(ret)); } else if (OB_UNLIKELY(!mig_tablet_param.is_valid()) || OB_UNLIKELY(ls_id != ls_->get_ls_id())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(mig_tablet_param), K_(ls)); } else if (OB_UNLIKELY(mig_tablet_param.is_empty_shell() && keep_old)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("unexpected error, rebuild create an empty shell tablet, but still need the old tablet", K(ret), K(mig_tablet_param), K(keep_old)); } else if (need_create_msd_tablet) { if (OB_FAIL(create_empty_shell_tablet(mig_tablet_param, new_tablet_handle))) { LOG_WARN("failed to create empty shell tablet", K(ret), K(tablet_id), K(mig_tablet_param)); } } else { ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); if (OB_FAIL(has_tablet(ls_id, tablet_id, b_exist))) { LOG_WARN("fail to check tablet existence", K(ls_id), K(tablet_id)); } else if (!b_exist && OB_FAIL(migrate_create_tablet(mig_tablet_param, new_tablet_handle))) { LOG_WARN("failed to rebuild create tablet", K(ret), K(tablet_id), K(mig_tablet_param)); } else if (b_exist && !keep_old && OB_FAIL(migrate_update_tablet(mig_tablet_param))) { LOG_WARN("failed to rebuild create tablet", K(ret), K(tablet_id), K(mig_tablet_param)); } else if (b_exist && keep_old) { if (OB_FAIL(ObTabletCreateDeleteHelper::check_and_get_tablet(key, old_tablet_handle, ObTabletCommon::DEFAULT_GET_TABLET_DURATION_US, ObMDSGetTabletMode::READ_WITHOUT_CHECK, ObTransVersion::MAX_TRANS_VERSION))) { LOG_WARN("failed to check and get tablet", K(ret), K(key)); } else if (OB_UNLIKELY(old_tablet_handle.get_obj()->get_tablet_meta().has_next_tablet_)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("number of nodes on list exceeds 2", K(ret)); } else if (OB_FAIL(rebuild_tablet_with_old(mig_tablet_param, old_tablet_handle))) { LOG_WARN("failed to rebuild tablet and maintain linked list", K(ret), K(tablet_id)); } } } return ret; } int ObLSTabletService::build_ha_tablet_new_table_store( const ObTabletID &tablet_id, const ObBatchUpdateTableStoreParam ¶m) { int ret = OB_SUCCESS; ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "BuildHaTab")); ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); ObMetaDiskAddr disk_addr; ObTimeGuard time_guard("ObLSTabletService::build_ha_tablet_new_table_store", 1_s); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(is_stopped_)) { ret = OB_NOT_RUNNING; LOG_WARN("tablet service stopped", K(ret)); } else if (OB_UNLIKELY(!tablet_id.is_valid() || !param.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(tablet_id), K(param)); } else { ObTabletHandle old_tablet_handle; ObTabletHandle tmp_tablet_handle; ObTabletHandle new_tablet_handle; ObBucketHashWLockGuard lock_guard(bucket_lock_, tablet_id.hash()); time_guard.click("Lock"); if (OB_FAIL(direct_get_tablet(tablet_id, old_tablet_handle))) { LOG_WARN("failed to get tablet", K(ret), K(tablet_id)); } else if (old_tablet_handle.get_obj()->is_empty_shell()) { LOG_INFO("old tablet is empty shell tablet, should skip this operation", K(ret), "old_tablet", old_tablet_handle.get_obj()); } else { time_guard.click("GetTablet"); ObTablet *old_tablet = old_tablet_handle.get_obj(); ObTablet *tmp_tablet = nullptr; const share::ObLSID &ls_id = ls_->get_ls_id(); const ObTabletMapKey key(ls_id, tablet_id); if (OB_FAIL(ObTabletCreateDeleteHelper::acquire_tmp_tablet(key, allocator, tmp_tablet_handle))) { LOG_WARN("failed to acquire tablet", K(ret), K(key)); } else if (FALSE_IT(tmp_tablet = tmp_tablet_handle.get_obj())) { } else if (OB_FAIL(tmp_tablet->init_for_sstable_replace(allocator, param, *old_tablet))) { LOG_WARN("failed to init tablet", K(ret), KPC(old_tablet)); } else if (FALSE_IT(time_guard.click("InitTablet"))) { } else if (OB_FAIL(ObTabletPersister::persist_and_transform_tablet(*tmp_tablet, new_tablet_handle))) { LOG_WARN("fail to persist and transform tablet", K(ret), KPC(tmp_tablet), K(new_tablet_handle)); } else if (FALSE_IT(time_guard.click("Persist"))) { } else if (FALSE_IT(disk_addr = new_tablet_handle.get_obj()->tablet_addr_)) { } else if (OB_FAIL(ObTabletSlogHelper::write_update_tablet_slog(ls_id, tablet_id, disk_addr))) { LOG_WARN("fail to write update tablet slog", K(ret), K(ls_id), K(tablet_id), K(disk_addr)); } else if (FALSE_IT(time_guard.click("WrSlog"))) { } else if (OB_FAIL(t3m->compare_and_swap_tablet(key, old_tablet_handle, new_tablet_handle))) { LOG_ERROR("failed to compare and swap tablet", K(ret), K(key), K(disk_addr)); ob_usleep(1000 * 1000); ob_abort(); } else { time_guard.click("CASwap"); LOG_INFO("succeed to build ha tablet new table store", K(ret), K(key), K(disk_addr), K(param)); } } } return ret; } int ObLSTabletService::need_check_old_row_legitimacy(ObDMLRunningCtx &run_ctx, bool &need_check, bool &is_udf) { int ret = OB_SUCCESS; ObRelativeTable &data_table = run_ctx.relative_table_; need_check = false; const ObDMLBaseParam &dml_param = run_ctx.dml_param_; is_udf = false; // TODO(jingxing): setting this to true if (OB_FAIL(data_table.has_udf_column(need_check))) { LOG_WARN("check has udf column failed", K(ret)); } else if (need_check) { is_udf = true; ObTableStoreIterator &table_iter = *data_table.tablet_iter_.table_iter(); while (OB_SUCC(ret) && !need_check) { ObITable *table_ptr = nullptr; if (OB_FAIL(table_iter.get_next(table_ptr))) { if (OB_ITER_END != ret) { LOG_WARN("get next table failed", K(ret)); } } else if (OB_ISNULL(table_ptr)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("error unexpected, table ptr must not be nullptr", K(ret)); } else { need_check = table_ptr->is_major_sstable(); } } } else if (dml_param.is_batch_stmt_ && !data_table.is_index_table()) { //batch stmt execution dependency defensive check to check //if the same row was modified multiple times need_check = true; ret = OB_E(EventTable::EN_INS_MULTI_VALUES_BATCH_OPT) OB_SUCCESS; // no need to check old row, just for bmsql performance optimization // TODO yuchen.ywc if (OB_SUCCESS != ret) { LOG_INFO("error sim when current statement is batch update", K(ret), K(is_udf)); need_check = false; ret = OB_SUCCESS; } } else if (GCONF.enable_defensive_check()) { need_check = true; if (data_table.is_index_table() && !data_table.can_read_index()) { //index can not be read during building index, so does not check old index row need_check = false; } if (ObDmlFlag::DF_LOCK == run_ctx.dml_flag_) { need_check = false; } } return ret; } int ObLSTabletService::construct_table_rows( const ObNewRow *rows, ObStoreRow *tbl_rows, int64_t row_count) { int ret = OB_SUCCESS; if (row_count <= 0) { ret = OB_ERR_WRONG_VALUE_COUNT_ON_ROW; LOG_WARN("row count should be bigger than 0", K(row_count), K(ret)); } else { for (int64_t i = 0; i < row_count; i++) { tbl_rows[i].row_val_ = rows[i]; } } return ret; } int ObLSTabletService::check_old_row_legitimacy( ObTabletHandle &data_tablet_handle, ObDMLRunningCtx &run_ctx, const common::ObNewRow &old_row) { int ret = OB_SUCCESS; ObRelativeTable &data_table = run_ctx.relative_table_; ObStoreRowkey rowkey; bool need_check = false; bool is_udf = false; rowkey.assign(old_row.cells_, data_table.get_rowkey_column_num()); if (OB_UNLIKELY(rowkey.get_obj_cnt() > old_row.count_) || OB_ISNULL(run_ctx.column_ids_)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("old row is invalid", K(ret), K(old_row), K(rowkey.get_obj_cnt()), KP(run_ctx.column_ids_)); } else if (OB_FAIL(need_check_old_row_legitimacy(run_ctx, need_check, is_udf))) { LOG_WARN("identify need check old row legitimacy", K(ret)); } else if (need_check) { //the vertical partition is no longer maintained, //and the defense check skips the vertical partition function const ObDMLBaseParam &dml_param = run_ctx.dml_param_; ObArenaAllocator scan_allocator(common::ObMemAttr(MTL_ID(), ObModIds::OB_TABLE_SCAN_ITER)); ObIAllocator *allocator = &scan_allocator; ObSingleRowGetter old_row_getter(*allocator, *data_tablet_handle.get_obj()); ObNewRow *storage_old_row = nullptr; //check old row whether different with SQL.old_row, ObDatumRowkey datum_rowkey; ObDatumRowkeyHelper rowkey_helper; const ObIArray &column_ids = *run_ctx.column_ids_; uint64_t err_col_id = OB_INVALID_ID; if (OB_FAIL(rowkey_helper.convert_datum_rowkey(rowkey.get_rowkey(), datum_rowkey))) { STORAGE_LOG(WARN, "Failed to transfer datum rowkey", K(ret), K(rowkey)); } else if (OB_FAIL(init_single_row_getter(old_row_getter, run_ctx, column_ids, data_table, true))) { LOG_WARN("failed to init single row getter", K(ret)); } else if (OB_FAIL(old_row_getter.open(datum_rowkey, true))) { LOG_WARN("open old row getter failed", K(ret), K(rowkey)); } else if (OB_FAIL(old_row_getter.get_next_row(storage_old_row))) { if (OB_ITER_END == ret) { ret = OB_ERR_DEFENSIVE_CHECK; FLOG_WARN("old row in storage is not exists", K(ret)); } else { LOG_WARN("get next row from old_row_iter failed", K(ret), KPC(run_ctx.column_ids_), K(old_row)); } } else if (OB_ISNULL(storage_old_row)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("unexpected error, storage old row is NULL", K(ret)); } else if (storage_old_row->get_count() != old_row.get_count()) { ret = OB_ERR_DEFENSIVE_CHECK; FLOG_WARN("storage old row is not matched with sql old row", K(ret)); } else { for (int64_t i = 0; OB_SUCC(ret) && i < old_row.get_count(); ++i) { const ObObj &storage_val = storage_old_row->get_cell(i); const ObObj &sql_val = old_row.get_cell(i); int cmp = 0; if (sql_val.is_lob_storage()) { // skip all text and lob } else if (OB_UNLIKELY(ObLongTextType == storage_val.get_type() && sql_val.is_lob_locator())) { //skip check lob column type when do the normal sql write check } else if (OB_UNLIKELY(storage_val.is_nop_value())) { bool is_nop = false; if (OB_FAIL(data_table.is_nop_default_value(column_ids.at(i), is_nop))) { LOG_WARN("check column whether has nop default value failed", K(ret), K(column_ids.at(i))); } else if (!is_nop) { err_col_id = column_ids.at(i); ret = OB_ERR_DEFENSIVE_CHECK; FLOG_WARN("storage old row is not matched with sql old row", K(ret), K(i), K(column_ids.at(i)), K(storage_val), K(sql_val)); } } else if (sql_val.is_nop_value()) { //this column is nop val, means that this column does not be touched by DML //just ignore it } else if (OB_FAIL(storage_val.compare(sql_val, cmp)) || 0 != cmp) { ret = OB_ERR_DEFENSIVE_CHECK; err_col_id = column_ids.at(i); FLOG_WARN("storage_val is not equal with sql_val, maybe catch a bug", K(ret), K(storage_val), K(sql_val), K(cmp), K(column_ids.at(i))); } } } if (OB_ERR_DEFENSIVE_CHECK == ret && dml_param.is_batch_stmt_) { // 批量删除的时候可能索引表的删除在主表前边,所以所有的表在batch删除的时候出现4377,都可能是重复删导致的 ret = OB_BATCHED_MULTI_STMT_ROLLBACK; LOG_TRACE("batch stmt execution has a correctness error, needs rollback", K(ret), "column_id", column_ids, KPC(storage_old_row), "sql_old_row", old_row, "dml_param", run_ctx.dml_param_, "dml_type", run_ctx.dml_flag_); } if (OB_ERR_DEFENSIVE_CHECK == ret) { int tmp_ret = OB_SUCCESS; bool is_virtual_gen_col = false; if (OB_TMP_FAIL(check_real_leader_for_4377_(run_ctx.store_ctx_.ls_id_))) { ret = tmp_ret; LOG_WARN("check real leader for 4377 found exception", K(ret), K(old_row), K(data_table)); } else if (nullptr != run_ctx.store_ctx_.mvcc_acc_ctx_.tx_desc_ && OB_TMP_FAIL(check_need_rollback_in_transfer_for_4377_(run_ctx.store_ctx_.mvcc_acc_ctx_.tx_desc_, data_tablet_handle))) { ret = tmp_ret; LOG_WARN("check need rollback in transfer for 4377 found exception", K(ret), K(old_row), K(data_table)); } else if (OB_TMP_FAIL(check_parts_tx_state_in_transfer_for_4377_(run_ctx.store_ctx_.mvcc_acc_ctx_.tx_desc_))) { ret = tmp_ret; LOG_WARN("check need rollback in transfer for 4377 found exception", K(ret), K(old_row), K(data_table)); } else if (is_udf) { ret = OB_ERR_INDEX_KEY_NOT_FOUND; LOG_WARN("index key not found on udf column", K(ret), K(old_row)); } else if (data_table.is_index_table() && OB_TMP_FAIL(check_is_gencol_check_failed(data_table, err_col_id, is_virtual_gen_col))) { //don't change ret if gencol check failed LOG_WARN("check is functional index failed", K(ret), K(tmp_ret), K(data_table)); } else if (is_virtual_gen_col) { ret = OB_ERR_GENCOL_LEGIT_CHECK_FAILED; LOG_WARN("Legitimacy check failed for functional index.", K(ret), K(old_row), KPC(storage_old_row)); } if (OB_ERR_DEFENSIVE_CHECK == ret) { ObString func_name = ObString::make_string("check_old_row_legitimacy"); LOG_USER_ERROR(OB_ERR_DEFENSIVE_CHECK, func_name.length(), func_name.ptr()); LOG_DBA_ERROR(OB_ERR_DEFENSIVE_CHECK, "msg", "Fatal Error!!! Catch a defensive error!", K(ret), "column_id", column_ids, KPC(storage_old_row), "sql_old_row", old_row, "dml_param", run_ctx.dml_param_, "dml_flag", run_ctx.dml_flag_, "store_ctx", run_ctx.store_ctx_, "relative_table", run_ctx.relative_table_); LOG_ERROR("Dump data table info", K(ret), K(data_table)); run_ctx.store_ctx_.force_print_trace_log(); } } } return ret; } int ObLSTabletService::check_is_gencol_check_failed(const ObRelativeTable &data_table, uint64_t error_col_id, bool &is_virtual_gen_col) { int ret = OB_SUCCESS; is_virtual_gen_col = false; if (data_table.is_index_table()) { const ObColumnParam *param = nullptr; const uint64_t tenant_id = MTL_ID(); uint64_t index_table_id = data_table.get_table_id(); const ObTableSchema *index_table_schema = NULL; const ObTableSchema *data_table_schema = NULL; ObMultiVersionSchemaService *schema_service = MTL(ObTenantSchemaService*)->get_schema_service(); ObSchemaGetterGuard schema_guard; if (OB_ISNULL(schema_service)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("unexpected null", K(ret), KP(schema_service)); } else if (OB_FAIL(schema_service->get_tenant_schema_guard(tenant_id, schema_guard))) { LOG_WARN("failed to get schema manager", K(ret), K(tenant_id)); } else if (OB_FAIL(schema_guard.get_table_schema(tenant_id, index_table_id, index_table_schema))) { LOG_WARN("get index table schema failed", K(ret)); } else if (OB_ISNULL(index_table_schema)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("index table schema is unexpected null", K(ret)); } else if (OB_FAIL(schema_guard.get_table_schema(tenant_id, index_table_schema->get_data_table_id(), data_table_schema))) { LOG_WARN("get data table schema failed", K(ret)); } else if (OB_ISNULL(data_table_schema)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("data table schema is unexpected null", K(ret)); } else if (OB_INVALID_ID != error_col_id) { //check specified column const ObColumnSchemaV2 *column = NULL; if (is_shadow_column(error_col_id)) { //shadow column does not exists in basic table, do nothing } else if (OB_ISNULL(column = data_table_schema->get_column_schema(error_col_id))) { ret = OB_ERR_UNEXPECTED; LOG_WARN("unexpected null", K(ret), KP(column)); } else if (column->is_virtual_generated_column()) { is_virtual_gen_col = true; } } else { //check all columns for (ObTableSchema::const_column_iterator iter = index_table_schema->column_begin(); OB_SUCC(ret) && iter != index_table_schema->column_end() && !is_virtual_gen_col; iter++) { const ObColumnSchemaV2 *column = *iter; //the column id in the data table is the same with that in the index table if (OB_ISNULL(column)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("unexpected null", K(ret), KP(column)); } else if (is_shadow_column(column->get_column_id())) { //shadow column does not exists in basic table, do nothing } else if (OB_ISNULL(column = data_table_schema->get_column_schema(column->get_column_id()))) { ret = OB_ERR_UNEXPECTED; LOG_WARN("unexpected null", K(ret), KP(column)); } else if (column->is_virtual_generated_column()) { is_virtual_gen_col = true; } } } } return ret; } int ObLSTabletService::check_new_row_legitimacy( ObDMLRunningCtx &run_ctx, const common::ObNewRow &new_row) { int ret = OB_SUCCESS; ObRelativeTable &data_table = run_ctx.relative_table_; int64_t data_table_cnt = data_table.get_column_count(); if (OB_ISNULL(run_ctx.column_ids_)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("column ids is nullptr", K(ret)); } else if (OB_FAIL(check_new_row_nullable_value(*run_ctx.column_ids_, data_table, new_row))) { LOG_WARN("check new row nullable value failed", K(ret), "dml_param", run_ctx.dml_param_, "dml_type", run_ctx.dml_flag_); } else if (OB_FAIL(check_new_row_shadow_pk(*run_ctx.column_ids_, data_table, new_row))) { LOG_WARN("check new row nullable value failed", K(ret), "dml_param", run_ctx.dml_param_, "dml_type", run_ctx.dml_flag_); } return ret; } int ObLSTabletService::insert_rows_to_tablet( ObTabletHandle &tablet_handle, ObDMLRunningCtx &run_ctx, const ObNewRow * const rows, const int64_t row_count, ObRowsInfo &rows_info, ObStoreRow *tbl_rows, int64_t &afct_num, int64_t &dup_num) { int ret = OB_SUCCESS; ObStoreCtx &ctx = run_ctx.store_ctx_; const ObDMLBaseParam &dml_param = run_ctx.dml_param_; ObRelativeTable &data_table = run_ctx.relative_table_; if (OB_FAIL(ret)) { } else if (ObClockGenerator::getClock() > dml_param.timeout_) { ret = OB_TIMEOUT; int64_t cur_time = ObClockGenerator::getClock(); LOG_WARN("query timeout", K(cur_time), K(dml_param), K(ret)); } else if (OB_FAIL(construct_table_rows(rows, tbl_rows, row_count))) { LOG_WARN("fail to construct table rows", K(ret)); } else if (OB_FAIL(rows_info.check_duplicate(tbl_rows, row_count, data_table))) { if (OB_ERR_PRIMARY_KEY_DUPLICATE == ret) { char rowkey_buffer[OB_TMP_BUF_SIZE_256]; if (OB_SUCCESS != extract_rowkey(data_table, rows_info.get_duplicate_rowkey(), rowkey_buffer, OB_TMP_BUF_SIZE_256, run_ctx.dml_param_.tz_info_)) { LOG_WARN("extract rowkey failed"); } else { ObString index_name = "PRIMARY"; if (data_table.is_index_table()) { data_table.get_index_name(index_name); } LOG_USER_ERROR(OB_ERR_PRIMARY_KEY_DUPLICATE, rowkey_buffer, index_name.length(), index_name.ptr()); } } else { LOG_WARN("fail to check duplicate", K(ret)); } } else if (OB_FAIL(insert_lob_tablet_rows(tablet_handle, run_ctx, tbl_rows, row_count))) { LOG_WARN("failed to insert rows to lob tablet", K(ret)); } else if (OB_FAIL(insert_tablet_rows(row_count, tablet_handle, run_ctx, tbl_rows, rows_info))) { LOG_WARN("failed to insert rows to data tablet", K(ret)); } else { afct_num = afct_num + row_count; } return ret; } int ObLSTabletService::insert_tablet_rows( const int64_t row_count, ObTabletHandle &tablet_handle, ObDMLRunningCtx &run_ctx, ObStoreRow *rows, ObRowsInfo &rows_info) { int ret = OB_SUCCESS; ObRelativeTable &table = run_ctx.relative_table_; const bool check_exists = !table.is_storage_index_table() || table.is_unique_index(); bool exists = false; // 1. Defensive checking of new rows. if (GCONF.enable_defensive_check()) { for (int64_t i = 0; OB_SUCC(ret) && i < row_count; i++) { ObStoreRow &tbl_row = rows[i]; if (OB_FAIL(check_new_row_legitimacy(run_ctx, tbl_row.row_val_))) { LOG_WARN("Failed to check new row legitimacy", K(ret), K_(tbl_row.row_val)); } } } // 2. Check uniqueness constraint in memetable only(active + frozen). // It would be more efficient and elegant to completely merge the uniqueness constraint // and write conflict checking, but the implementation currently is to minimize intrusion // into the memtable. if (check_exists && OB_FAIL(tablet_handle.get_obj()->rowkeys_exists(run_ctx.store_ctx_, table, rows_info, exists))) { LOG_WARN("Failed to check the uniqueness constraint", K(ret), K(rows_info)); } else if (exists) { ret = OB_ERR_PRIMARY_KEY_DUPLICATE; blocksstable::ObDatumRowkey &duplicate_rowkey = rows_info.get_conflict_rowkey(); LOG_WARN("Rowkey already exist", K(ret), K(table), K(duplicate_rowkey)); } // 3. Insert rows with uniqueness constraint and write conflict checking. // Check write conflict in memtable + sstable. // Check uniqueness constraint in sstable only. if (OB_SUCC(ret)) { if (OB_FAIL(tablet_handle.get_obj()->insert_rows(table, run_ctx.store_ctx_, rows, rows_info, check_exists, *run_ctx.col_descs_, row_count, run_ctx.dml_param_.encrypt_meta_))) { if (OB_ERR_PRIMARY_KEY_DUPLICATE == ret) { blocksstable::ObDatumRowkey &duplicate_rowkey = rows_info.get_conflict_rowkey(); LOG_WARN("Rowkey already exist", K(ret), K(table), K(duplicate_rowkey), K(rows_info.get_conflict_idx())); } else if (OB_TRY_LOCK_ROW_CONFLICT != ret) { LOG_WARN("Failed to insert rows to tablet", K(ret), K(rows_info)); } } } // 4. Log user error message if rowkey is duplicate. if (OB_ERR_PRIMARY_KEY_DUPLICATE == ret && !run_ctx.dml_param_.is_ignore_) { int tmp_ret = OB_SUCCESS; char rowkey_buffer[OB_TMP_BUF_SIZE_256]; ObString index_name = "PRIMARY"; if (OB_TMP_FAIL(extract_rowkey(table, rows_info.get_conflict_rowkey(), rowkey_buffer, OB_TMP_BUF_SIZE_256, run_ctx.dml_param_.tz_info_))) { LOG_WARN("Failed to extract rowkey", K(ret), K(tmp_ret)); } if (table.is_index_table()) { if (OB_TMP_FAIL(table.get_index_name(index_name))) { LOG_WARN("Failed to get index name", K(ret), K(tmp_ret)); } } else if (lib::is_oracle_mode() && OB_TMP_FAIL(table.get_primary_key_name(index_name))) { LOG_WARN("Failed to get pk name", K(ret), K(tmp_ret)); } LOG_USER_ERROR(OB_ERR_PRIMARY_KEY_DUPLICATE, rowkey_buffer, index_name.length(), index_name.ptr()); } return ret; } int ObLSTabletService::insert_lob_col( ObDMLRunningCtx &run_ctx, const ObColDesc &column, ObObj &obj, ObLobAccessParam *del_param, ObLobCommon *lob_common) { int ret = OB_SUCCESS; uint64_t lob_id; ObLobManager *lob_mngr = MTL(ObLobManager*); if (OB_ISNULL(lob_mngr)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("[STORAGE_LOB]failed to get lob manager handle.", K(ret)); } else if (!column.col_type_.is_lob_storage() || obj.is_nop_value() || obj.is_null()) { // do nothing } else { // init lob access param ObLobAccessParam lob_param; lob_param.tx_desc_ = run_ctx.store_ctx_.mvcc_acc_ctx_.tx_desc_; lob_param.parent_seq_no_ = run_ctx.store_ctx_.mvcc_acc_ctx_.tx_scn_; lob_param.snapshot_ = run_ctx.dml_param_.snapshot_; lob_param.is_total_quantity_log_ = run_ctx.dml_param_.is_total_quantity_log_; if (lob_param.snapshot_.is_none_read()) { // NOTE: // lob_insert need table_scan, the snapshot already generated in // run_ctx.store_ctx, use it as an LS ReadSnapshot lob_param.snapshot_.init_ls_read(run_ctx.store_ctx_.ls_id_, run_ctx.store_ctx_.mvcc_acc_ctx_.snapshot_); } lob_param.tx_id_ = lob_param.tx_desc_->get_tx_id(); lob_param.sql_mode_ = run_ctx.dml_param_.sql_mode_; lob_param.ls_id_ = run_ctx.store_ctx_.ls_id_; lob_param.tablet_id_ = run_ctx.relative_table_.get_tablet_id(); lob_param.coll_type_ = column.col_type_.get_collation_type(); lob_param.allocator_ = &run_ctx.lob_allocator_; lob_param.lob_common_ = lob_common; if (OB_NOT_NULL(del_param)) { lob_param.handle_size_ = del_param->handle_size_; lob_param.checksum_ = del_param->checksum_; lob_param.total_seq_cnt_ = del_param->total_seq_cnt_; lob_param.used_seq_cnt_ = del_param->used_seq_cnt_; lob_param.seq_no_st_ = del_param->seq_no_st_; } lob_param.timeout_ = run_ctx.dml_param_.timeout_; lob_param.scan_backward_ = false; lob_param.offset_ = 0; // Notice: currently only inrow data ObString raw_data = obj.get_string(); ObString data; // for not strict sql mode, will insert empty string without lob header bool has_lob_header = obj.has_lob_header() && raw_data.length() > 0; ObLobLocatorV2 loc(raw_data, has_lob_header); if (OB_FAIL(lob_mngr->append(lob_param, loc))) { LOG_WARN("[STORAGE_LOB]lob append failed.", K(ret)); } else { ObLobCommon *res_lob_common = lob_param.lob_common_; obj.set_lob_value(obj.get_type(), res_lob_common, lob_param.handle_size_); LOG_DEBUG("[STORAGE_LOB]write ob lob data.", K(lob_param), KPC(res_lob_common), K(lob_param.handle_size_), K(column.col_type_.get_collation_type())); } } return ret; } int ObLSTabletService::check_lob_tablet_valid(ObTabletHandle &data_tablet) { int ret = OB_SUCCESS; bool is_valid_aux_lob_table = false; ObTabletBindingMdsUserData ddl_data; if (OB_FAIL(data_tablet.get_obj()->ObITabletMdsInterface::get_ddl_data(share::SCN::max_scn(), ddl_data))) { LOG_WARN("failed to get ddl data from tablet", K(ret), K(data_tablet)); } else { is_valid_aux_lob_table = ddl_data.lob_meta_tablet_id_.is_valid() && ddl_data.lob_piece_tablet_id_.is_valid(); if (!is_valid_aux_lob_table) { ret = OB_ERR_UNEXPECTED; LOG_WARN("aux lob table must valid when lob column exist", K(ret), K(ddl_data)); } } return ret; } int ObLSTabletService::insert_lob_tablet_row( ObTabletHandle &data_tablet, ObDMLRunningCtx &run_ctx, ObStoreRow &row) { int ret = OB_SUCCESS; int64_t col_cnt = run_ctx.col_descs_->count(); ObLobManager *lob_mngr = MTL(ObLobManager*); bool check_lob = false; if (OB_ISNULL(lob_mngr)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("[STORAGE_LOB]failed to get lob manager handle.", K(ret)); } else if (row.row_val_.count_ != col_cnt) { ret = OB_ERR_UNEXPECTED; LOG_WARN("[STORAGE_LOB]column count invalid", K(ret), K(col_cnt), K(row.row_val_.count_)); } else { for (int64_t i = 0; OB_SUCC(ret) && i < col_cnt; ++i) { const ObColDesc &column = run_ctx.col_descs_->at(i); ObObj &obj = row.row_val_.get_cell(i); if (obj.is_null() || obj.is_nop_value()) { // do nothing } else if (column.col_type_.is_lob_storage()) { if (!check_lob) { if (OB_FAIL(check_lob_tablet_valid(data_tablet))) { LOG_WARN("failed to check_lob_tablet_valid", K(ret), K(data_tablet)); } else { check_lob = true; } } if (OB_FAIL(ret)) { } else if(OB_FAIL(insert_lob_col(run_ctx, column, obj, nullptr, nullptr))) { LOG_WARN("[STORAGE_LOB]failed to insert lob col.", K(ret), K(row), K(i)); } } } } return ret; } int ObLSTabletService::insert_lob_tablet_rows( ObTabletHandle &data_tablet, ObDMLRunningCtx &run_ctx, ObStoreRow *rows, int64_t row_count) { int ret = OB_SUCCESS; // DEBUG_SYNC(DELAY_INDEX_WRITE); ObLobManager *lob_mngr = MTL(ObLobManager*); if (OB_ISNULL(lob_mngr)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("[STORAGE_LOB]failed to get lob manager handle.", K(ret)); } else { int64_t col_cnt = run_ctx.col_descs_->count(); for (int64_t k = 0; OB_SUCC(ret) && k < row_count; k++) { if (OB_FAIL(insert_lob_tablet_row(data_tablet, run_ctx, rows[k]))) { LOG_WARN("[STORAGE_LOB]failed to insert lob row.", K(ret)); } } } return ret; } int ObLSTabletService::extract_rowkey( const ObRelativeTable &table, const blocksstable::ObDatumRowkey &rowkey, char *buffer, const int64_t buffer_len, const ObTimeZoneInfo *tz_info) { int ret = OB_SUCCESS; common::ObSEArray rowkey_cols; ObStoreRowkey store_rowkey; ObDatumRowkeyHelper rowkey_helper; if (OB_FAIL(table.get_rowkey_column_ids(rowkey_cols))) { STORAGE_LOG(WARN, "Failed to get rowkey cols", K(ret), K(table)); } else if (OB_FAIL(rowkey_helper.convert_store_rowkey(rowkey, rowkey_cols, store_rowkey))) { STORAGE_LOG(WARN, "Failed to convert store rowkey", K(ret), K(rowkey)); } else { ret = extract_rowkey(table, store_rowkey, buffer, buffer_len, tz_info); } return ret; } int ObLSTabletService::extract_rowkey( const ObRelativeTable &table, const common::ObStoreRowkey &rowkey, char *buffer, const int64_t buffer_len, const ObTimeZoneInfo *tz_info) { int ret = OB_SUCCESS; if (!table.is_valid() || !rowkey.is_valid() || OB_ISNULL(buffer) || buffer_len <= 0) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid argument", K(ret), K(table), K(rowkey), K(buffer), K(buffer_len), K(tz_info)); } else { const int64_t rowkey_size = table.get_rowkey_column_num(); int64_t pos = 0; int64_t valid_rowkey_size = 0; uint64_t column_id = OB_INVALID_ID; for (int64_t i = 0; OB_SUCC(ret) && i < rowkey_size; i++) { if (OB_FAIL(table.get_rowkey_col_id_by_idx(i, column_id))) { ret = OB_ERR_UNEXPECTED; LOG_WARN("Failed to get rowkey column description", K(i), K(ret)); } else if (column_id <= OB_MIN_SHADOW_COLUMN_ID) { valid_rowkey_size ++; } } for (int64_t i = 0; OB_SUCC(ret) && i < valid_rowkey_size; ++i) { const ObObj &obj = rowkey.get_obj_ptr()[i]; if (OB_FAIL(obj.print_plain_str_literal(buffer, buffer_len - 1, pos, tz_info))) { LOG_WARN("fail to print_plain_str_literal", K(ret)); } else if (i < valid_rowkey_size - 1) { if (OB_FAIL(databuff_printf(buffer, buffer_len - 1, pos, "-"))) { LOG_WARN("databuff print failed", K(ret)); } } } if (buffer != nullptr) { buffer[pos++] = '\0'; } } return ret; } int ObLSTabletService::get_next_rows( ObNewRowIterator *row_iter, ObNewRow *&rows, int64_t &row_count) { return row_iter->get_next_rows(rows, row_count); } int ObLSTabletService::construct_update_idx( const int64_t schema_rowkey_cnt, const share::schema::ColumnMap *col_map, const common::ObIArray &upd_col_ids, UpdateIndexArray &update_idx) { int ret = OB_SUCCESS; int err = OB_SUCCESS; if (OB_ISNULL(col_map) || upd_col_ids.count() <= 0 || update_idx.count() > 0 || schema_rowkey_cnt <= 0) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(col_map), K(upd_col_ids), K(upd_col_ids.count()), K(schema_rowkey_cnt)); } else { for (int64_t i = 0; OB_SUCC(ret) && i < upd_col_ids.count(); ++i) { int32_t idx = -1; const uint64_t &col_id = upd_col_ids.at(i); if (OB_SUCCESS != (err = col_map->get(col_id, idx)) || idx < 0) { ret = OB_ERR_UNEXPECTED; LOG_WARN("column id doesn't exist", K(ret), K(col_id), K(err)); } else if (idx < schema_rowkey_cnt) { // update_idx should not contain rowkey } else if (OB_FAIL(update_idx.push_back(idx))) { LOG_WARN("fail to push idx into update_idx", K(ret), K(idx)); } } if (OB_SUCC(ret) && update_idx.count() > 1) { std::sort(update_idx.begin(), update_idx.end()); } } return ret; } int ObLSTabletService::check_rowkey_change( const ObIArray &update_ids, const ObRelativeTable &relative_table, bool &rowkey_change, bool &delay_new) { int ret = OB_SUCCESS; if (OB_UNLIKELY(update_ids.count() <= 0 || !relative_table.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(update_ids), K(ret)); } else { const int64_t count = update_ids.count(); bool is_rowkey = false; rowkey_change = false; delay_new = false; for (int64_t i = 0; OB_SUCC(ret) && i < count && !rowkey_change; ++i) { if (OB_FAIL(relative_table.is_rowkey_column_id(update_ids.at(i), is_rowkey))) { LOG_WARN("check is_rowkey fail", K(ret), K(update_ids.at(i))); } else { rowkey_change = is_rowkey; } } if (OB_FAIL(ret)) { // do nothing } else if (relative_table.is_unique_index() && !rowkey_change) { uint64_t cid = OB_INVALID_ID; bool innullable = true; for (int64_t j = 0; OB_SUCC(ret) && j < relative_table.get_rowkey_column_num() && !rowkey_change; ++j) { if (OB_FAIL(relative_table.get_rowkey_col_id_by_idx(j, cid))) { LOG_WARN("get rowkey column id fail", K(ret), K(j)); } else if (cid > OB_MIN_SHADOW_COLUMN_ID) { if (innullable) { break; // other_change } else { cid -= OB_MIN_SHADOW_COLUMN_ID; for (int64_t k = 0; OB_SUCC(ret) && k < count; ++k) { if (cid == update_ids.at(k)) { rowkey_change = true; break; } } } } else { bool is_nullable = false; if (OB_FAIL(relative_table.is_column_nullable_for_write(cid, is_nullable))) { LOG_WARN("check nullable fail", K(ret), K(cid), K(relative_table)); } else if (is_nullable) { innullable = false; } } } } if (OB_SUCC(ret) && rowkey_change) { delay_new = true; } LOG_DEBUG("check rowkey change for update", K(rowkey_change), K(delay_new), K(update_ids), K(relative_table)); } return ret; } int ObLSTabletService::check_rowkey_value_change( const common::ObNewRow &old_row, const common::ObNewRow &new_row, const int64_t rowkey_len, bool &rowkey_change) { int ret = OB_SUCCESS; if (OB_UNLIKELY(rowkey_len <= 0) || OB_UNLIKELY(old_row.count_ < rowkey_len) || OB_UNLIKELY(new_row.count_ < rowkey_len)) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(old_row), K(new_row), K(rowkey_len), K(ret)); } else { rowkey_change = false; for (int64_t i = 0; !rowkey_change && i < rowkey_len; ++i) { if (old_row.cells_[i] != new_row.cells_[i]) { rowkey_change = true; } } } LOG_DEBUG("check rowkey value for update", K(rowkey_change), K(old_row), K(new_row)); return ret; } int ObLSTabletService::process_delta_lob( ObDMLRunningCtx &run_ctx, const ObColDesc &column, ObObj &old_obj, ObLobLocatorV2 &delta_lob, ObObj &obj) { int ret = OB_SUCCESS; ObLobManager *lob_mngr = MTL(ObLobManager*); if (OB_ISNULL(lob_mngr)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("[STORAGE_LOB]failed to get lob manager handle.", K(ret)); } else if (!delta_lob.is_delta_temp_lob()) { ret = OB_ERR_UNEXPECTED; LOG_WARN("[STORAGE_LOB] invalid lob type", K(ret), K(delta_lob)); } else { ObLobAccessParam lob_param; // init lob param lob_param.tx_desc_ = run_ctx.store_ctx_.mvcc_acc_ctx_.tx_desc_; lob_param.parent_seq_no_ = run_ctx.store_ctx_.mvcc_acc_ctx_.tx_scn_; lob_param.snapshot_ = run_ctx.dml_param_.snapshot_; if (lob_param.snapshot_.is_none_read()) { // NOTE: // lob_insert need table_scan, the snapshot already generated in // run_ctx.store_ctx, use it as an LS ReadSnapshot lob_param.snapshot_.init_ls_read(run_ctx.store_ctx_.ls_id_, run_ctx.store_ctx_.mvcc_acc_ctx_.snapshot_); } lob_param.tx_id_ = lob_param.tx_desc_->get_tx_id(); lob_param.sql_mode_ = run_ctx.dml_param_.sql_mode_; lob_param.ls_id_ = run_ctx.store_ctx_.ls_id_; lob_param.tablet_id_ = run_ctx.relative_table_.get_tablet_id(); lob_param.coll_type_ = column.col_type_.get_collation_type(); lob_param.allocator_ = &run_ctx.lob_allocator_; // should use old obj lob ObLobLocatorV2 old_lob; ObString old_disk_lob; if (OB_FAIL(old_obj.get_lob_locatorv2(old_lob))) { LOG_WARN("get old lob locator failed.", K(ret), K(old_obj)); } else if (!old_lob.is_valid()) { ret = OB_ERR_UNEXPECTED; LOG_WARN("old lob locator is invalid.", K(ret)); } else if (OB_FAIL(old_lob.get_disk_locator(old_disk_lob))) { LOG_WARN("fail to get old lob disk locator.", K(ret)); } else { lob_param.lob_locator_ = nullptr; lob_param.lob_common_ = reinterpret_cast(old_disk_lob.ptr()); lob_param.handle_size_ = old_disk_lob.length(); lob_param.byte_size_ = lob_param.lob_common_->get_byte_size(lob_param.handle_size_); lob_param.timeout_ = run_ctx.dml_param_.timeout_; lob_param.scan_backward_ = false; if (OB_FAIL(lob_mngr->process_delta(lob_param, delta_lob))) { LOG_WARN("failed to process delta lob.", K(ret), K(lob_param), K(delta_lob)); } else { // update obj with new disk locator obj.set_lob_value(obj.get_type(), lob_param.lob_common_, lob_param.handle_size_); } } } return ret; } int ObLSTabletService::process_lob_row( ObTabletHandle &tablet_handle, ObDMLRunningCtx &run_ctx, const ObIArray &update_idx, bool data_tbl_rowkey_change, ObStoreRow &old_sql_row, ObStoreRow &old_row, ObStoreRow &new_row) { int ret = OB_SUCCESS; bool check_lob = false; if (OB_UNLIKELY(old_row.row_val_.get_count() != new_row.row_val_.get_count())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("[STORAGE_LOB]invalid args", K(old_row), K(new_row), K(ret)); } else if (OB_UNLIKELY(old_row.row_val_.get_count() != run_ctx.col_descs_->count())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("[STORAGE_LOB]invalid args", K(old_row), K(new_row), KPC(run_ctx.col_descs_)); } else { for (int64_t i = 0; OB_SUCC(ret) && i < old_row.row_val_.get_count(); ++i) { if (run_ctx.col_descs_->at(i).col_type_.is_lob_storage()) { ObObj &old_obj = old_row.row_val_.get_cell(i); ObObj &old_sql_obj = old_sql_row.row_val_.get_cell(i); ObObj &new_obj = new_row.row_val_.get_cell(i); bool is_update = false; for (int64_t j = 0; !is_update && j < update_idx.count(); ++j) { if (update_idx.at(j) == i) { is_update = true; } } if (is_update) { if (!check_lob) { if (OB_FAIL(check_lob_tablet_valid(tablet_handle))) { LOG_WARN("failed to check_lob_tablet_valid", K(ret), K(tablet_handle)); } else { check_lob = true; } } // get new lob locator ObString new_lob_str = (new_obj.is_null() || new_obj.is_nop_value()) ? ObString(0, nullptr) : new_obj.get_string(); ObLobLocatorV2 new_lob(new_lob_str, new_obj.has_lob_header()); if (OB_FAIL(ret)) { } else if (new_obj.is_null() || new_obj.is_nop_value() || new_lob.is_full_temp_lob() || new_lob.is_persist_lob() || (new_lob.is_lob_disk_locator() && new_lob.has_inrow_data())) { ObLobCommon *lob_common = nullptr; ObLobAccessParam lob_param; if (OB_FAIL(new_lob.get_lob_data_byte_len(lob_param.update_len_))) { LOG_WARN("fail to get new lob byte len", K(ret), K(new_lob), K(i)); } else if (OB_FAIL(delete_lob_col(run_ctx, run_ctx.col_descs_->at(i), old_obj, old_sql_obj, lob_common, lob_param))) { LOG_WARN("[STORAGE_LOB]failed to erase old lob col", K(ret), K(old_sql_row), K(old_row), K(i)); } else if (OB_FAIL(insert_lob_col(run_ctx, run_ctx.col_descs_->at(i), new_obj, &lob_param, lob_common))) { LOG_WARN("[STORAGE_LOB]failed to insert new lob col.", K(ret), K(new_row), K(i)); } } else if (new_lob.is_delta_temp_lob()) { if (OB_FAIL(process_delta_lob(run_ctx, run_ctx.col_descs_->at(i), old_sql_obj, new_lob, new_obj))) { LOG_WARN("failed to process delta lob.", K(ret), K(i)); } } else { ret = OB_ERR_UNEXPECTED; LOG_WARN("unexpected obj for new lob", K(ret), K(i), K(new_obj), K(new_lob)); } } else { if (old_obj.is_null()) { new_obj.set_null(); } else if (old_obj.is_nop_value()) { new_obj.set_nop_value(); } else if (new_obj.is_nop_value() || new_obj.is_null()) { // do nothing } else { if (old_obj.is_null()) { new_obj.set_null(); } else if (old_obj.is_nop_value()) { new_obj.set_nop_value(); } else { ObString val_str = old_obj.get_string(); ObLobCommon *lob_common = reinterpret_cast(val_str.ptr()); if (!lob_common->in_row_ && data_tbl_rowkey_change) { ObLobAccessParam lob_param; if (val_str.length() < ObLobManager::LOB_WITH_OUTROW_CTX_SIZE) { ret = OB_ERR_UNEXPECTED; LOG_WARN("not enough space for lob header", K(ret), K(val_str), K(i)); } else if (OB_FAIL(delete_lob_col(run_ctx, run_ctx.col_descs_->at(i), old_obj, old_sql_obj, lob_common, lob_param))) { LOG_WARN("[STORAGE_LOB]failed to erase old lob col", K(ret), K(old_sql_row), K(old_row), K(i)); } else if (OB_FAIL(insert_lob_col(run_ctx, run_ctx.col_descs_->at(i), new_obj, nullptr, nullptr))) { // no need del_param LOG_WARN("[STORAGE_LOB]failed to insert new lob col.", K(ret), K(new_row), K(i)); } } else { new_obj.set_lob_value(new_obj.get_type(), val_str.ptr(), val_str.length()); // remove has lob header flag } } } } } } } return ret; } int ObLSTabletService::update_row_to_tablet( ObTabletHandle &tablet_handle, ObDMLRunningCtx &run_ctx, const bool rowkey_change, const ObIArray &update_idx, const bool delay_new, const bool lob_update, ObStoreRow &old_tbl_row, ObStoreRow &new_tbl_row, ObRowStore *row_store, bool &duplicate) { int ret = OB_SUCCESS; const ObDMLBaseParam &dml_param = run_ctx.dml_param_; const ObColDescIArray &col_descs = *run_ctx.col_descs_; bool data_tbl_rowkey_change = false; int64_t data_tbl_rowkey_len = run_ctx.relative_table_.get_rowkey_column_num(); ObSQLMode sql_mode = dml_param.sql_mode_; duplicate = false; ObStoreRow old_sql_tbl_row; old_sql_tbl_row.row_val_ = old_tbl_row.row_val_; if (OB_UNLIKELY(col_descs.count() != old_tbl_row.row_val_.get_count() || col_descs.count() != new_tbl_row.row_val_.get_count())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(col_descs.count()), K(old_tbl_row.row_val_), K(new_tbl_row.row_val_)); } else if (rowkey_change && OB_FAIL(check_rowkey_value_change(old_tbl_row.row_val_, new_tbl_row.row_val_, data_tbl_rowkey_len, data_tbl_rowkey_change))) { LOG_WARN("failed to check data table rowkey change", K(ret), K(old_tbl_row), K(new_tbl_row), K(data_tbl_rowkey_len)); } else if (OB_FAIL(process_old_row(tablet_handle, run_ctx, data_tbl_rowkey_change, lob_update, old_tbl_row))) { if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) { LOG_WARN("fail to process old row", K(ret), K(*run_ctx.col_descs_), K(old_tbl_row), K(data_tbl_rowkey_change)); } } else if (OB_FAIL(process_lob_row(tablet_handle, run_ctx, update_idx, data_tbl_rowkey_change, old_sql_tbl_row, old_tbl_row, new_tbl_row))) { LOG_WARN("failed to process lob col change", K(ret), K(old_tbl_row), K(new_tbl_row)); } else if (delay_new && lib::is_oracle_mode()) { // if total quantity log is needed, we should cache both new row and old row, // and the sequence is new_row1, old_row1, new_row2, old_row2...., // if total quantity log isn't needed, just cache new row if (OB_ISNULL(row_store)) { ret = OB_INVALID_ARGUMENT; LOG_WARN("row_store is NULL", K(ret)); } else if (OB_FAIL(row_store->add_row(new_tbl_row.row_val_))) { LOG_WARN("failed to store new row", K(new_tbl_row), K(ret)); } else if (OB_FAIL(row_store->add_row(old_tbl_row.row_val_))) { LOG_WARN("failed to store old row", K(old_tbl_row), K(ret)); } else { LOG_DEBUG("add row store for delay new", K(old_tbl_row), K(new_tbl_row)); } } else if (OB_FAIL(process_new_row(tablet_handle, run_ctx, update_idx, old_tbl_row, new_tbl_row, data_tbl_rowkey_change))) { if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) { LOG_WARN("fail to process new row", K(new_tbl_row), K(ret)); } } return ret; } int ObLSTabletService::process_old_row( ObTabletHandle &tablet_handle, ObDMLRunningCtx &run_ctx, const bool data_tbl_rowkey_change, const bool lob_update, ObStoreRow &tbl_row) { int ret = OB_SUCCESS; ObStoreCtx &store_ctx = run_ctx.store_ctx_; ObRelativeTable &relative_table = run_ctx.relative_table_; bool is_delete_total_quantity_log = run_ctx.dml_param_.is_total_quantity_log_; if (OB_UNLIKELY(!relative_table.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid relative tables", K(ret), K(relative_table)); } else if (OB_UNLIKELY(!store_ctx.is_valid() || nullptr == run_ctx.col_descs_ || run_ctx.col_descs_->count() <= 0 || !tbl_row.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(store_ctx), KP(run_ctx.col_descs_), K(tbl_row), K(is_delete_total_quantity_log)); } else if (OB_FAIL(check_old_row_legitimacy(tablet_handle, run_ctx, tbl_row.row_val_))) { if (OB_ERR_DEFENSIVE_CHECK == ret) { dump_diag_info_for_old_row_loss(relative_table, store_ctx, tbl_row); } LOG_WARN("check old row legitimacy failed", K(tbl_row.row_val_)); } else if (OB_FAIL(process_old_row_lob_col(tablet_handle, run_ctx, tbl_row))){ LOG_WARN("failed to process old row lob col", K(ret), K(tbl_row)); } else { ObColDescIArray &col_descs = const_cast(*run_ctx.col_descs_); const uint64_t &table_id = relative_table.get_table_id(); int64_t rowkey_size = relative_table.get_rowkey_column_num(); ObStoreRowkey store_rowkey; ObDatumRowkey datum_rowkey; ObDatumRowkeyHelper rowkey_helper(run_ctx.allocator_); if (OB_UNLIKELY(run_ctx.dml_param_.prelock_)) { bool locked = false; if (OB_FAIL(store_rowkey.assign(tbl_row.row_val_.cells_, rowkey_size))) { LOG_WARN("Failed to assign rowkey", K(ret), K(tbl_row), K(rowkey_size)); } else if (OB_FAIL(rowkey_helper.convert_datum_rowkey(store_rowkey.get_rowkey(), datum_rowkey))) { STORAGE_LOG(WARN, "Failed to transfer datum rowkey", K(ret), K(store_rowkey), K(rowkey_size), K(tbl_row)); } else if (OB_FAIL(check_row_locked_by_myself(tablet_handle, relative_table, store_ctx, datum_rowkey, locked))) { LOG_WARN("fail to check row locked", K(ret), K(tbl_row)); } else if (!locked) { ret = OB_ERR_ROW_NOT_LOCKED; LOG_DEBUG("row has not been locked", K(ret), K(tbl_row)); } } if (OB_FAIL(ret)) { } else if (data_tbl_rowkey_change) { ObStoreRow del_row(tbl_row); del_row.flag_.set_flag(ObDmlFlag::DF_DELETE); if (!is_delete_total_quantity_log) { if (OB_FAIL(tablet_handle.get_obj()->insert_row_without_rowkey_check(relative_table, run_ctx.store_ctx_, col_descs, del_row, run_ctx.dml_param_.encrypt_meta_))) { if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) { LOG_WARN("failed to write data tablet row", K(ret), K(del_row)); } } } else { ObStoreRow new_tbl_row; new_tbl_row.flag_.set_flag(ObDmlFlag::DF_DELETE); new_tbl_row.row_val_ = tbl_row.row_val_; del_row.flag_.set_flag(ObDmlFlag::DF_UPDATE); ObSEArray update_idx; if (OB_FAIL(tablet_handle.get_obj()->update_row(relative_table, run_ctx.store_ctx_, col_descs, update_idx, del_row, new_tbl_row, run_ctx.dml_param_.encrypt_meta_))) { if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) { LOG_WARN("failed to write data tablet row", K(ret), K(del_row), K(new_tbl_row)); } } } } else if (lob_update) { // need to lock main table rows that don't need to be deleted if (OB_FAIL(store_rowkey.assign(tbl_row.row_val_.cells_, rowkey_size))) { LOG_WARN("Failed to assign rowkey", K(ret), K(tbl_row), K(rowkey_size)); } else if (OB_FAIL(rowkey_helper.convert_datum_rowkey(store_rowkey.get_rowkey(), datum_rowkey))) { STORAGE_LOG(WARN, "Failed to transfer datum rowkey", K(ret), K(store_rowkey)); } else if (OB_FAIL(tablet_handle.get_obj()->lock_row(relative_table, store_ctx, datum_rowkey))) { if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) { LOG_WARN("lock row failed", K(ret), K(table_id), K(tbl_row), K(rowkey_size)); } } LOG_DEBUG("generate lock node before update lob columns", K(ret), K(table_id), K(tbl_row)); } } return ret; } int ObLSTabletService::process_new_row( ObTabletHandle &tablet_handle, ObDMLRunningCtx &run_ctx, const common::ObIArray &update_idx, const ObStoreRow &old_tbl_row, const ObStoreRow &new_tbl_row, const bool rowkey_change) { int ret = OB_SUCCESS; if (OB_UNLIKELY(update_idx.count() < 0 || !new_tbl_row.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(update_idx), K(new_tbl_row), K(rowkey_change)); } else if (GCONF.enable_defensive_check() && OB_FAIL(check_new_row_legitimacy(run_ctx, new_tbl_row.row_val_))) { LOG_WARN("check new row legitimacy failed", K(ret), K(new_tbl_row.row_val_)); } else { // write full column clog needs to construct update_idx and pass to memtable if (OB_FAIL(process_data_table_row(tablet_handle, run_ctx, update_idx, old_tbl_row, new_tbl_row, rowkey_change))) { if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) { LOG_WARN("fail to process data table row", K(ret), K(update_idx), K(old_tbl_row), K(new_tbl_row), K(rowkey_change)); } } } return ret; } int ObLSTabletService::process_data_table_row( ObTabletHandle &data_tablet, ObDMLRunningCtx &run_ctx, const ObIArray &update_idx, const ObStoreRow &old_tbl_row, const ObStoreRow &new_tbl_row, const bool rowkey_change) { int ret = OB_SUCCESS; ObStoreCtx &ctx = run_ctx.store_ctx_; ObRelativeTable &relative_table = run_ctx.relative_table_; bool is_update_total_quantity_log = run_ctx.dml_param_.is_total_quantity_log_; const common::ObTimeZoneInfo *tz_info = run_ctx.dml_param_.tz_info_; if (OB_UNLIKELY(!ctx.is_valid() || !relative_table.is_valid() || nullptr == run_ctx.col_descs_ || run_ctx.col_descs_->count() <= 0 || update_idx.count() < 0 || (is_update_total_quantity_log && !old_tbl_row.is_valid()) || !new_tbl_row.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(ctx), KP(run_ctx.col_descs_), K(update_idx), K(old_tbl_row), K(new_tbl_row), K(is_update_total_quantity_log), K(rowkey_change)); } else { const ObColDescIArray &col_descs = *run_ctx.col_descs_; bool exists = false; if (rowkey_change && OB_FAIL(data_tablet.get_obj()->rowkey_exists( relative_table, ctx, new_tbl_row.row_val_, exists))) { LOG_WARN("failed to check rowkey exists", K(ret), K(new_tbl_row)); } else if (exists) { char buffer[OB_TMP_BUF_SIZE_256]; ObStoreRowkey rowkey; ret = OB_ERR_PRIMARY_KEY_DUPLICATE; if (OB_SUCCESS != rowkey.assign(new_tbl_row.row_val_.cells_, relative_table.get_rowkey_column_num())) { LOG_WARN("Failed to assign rowkey", K(new_tbl_row)); } else if (OB_SUCCESS != extract_rowkey(relative_table, rowkey, buffer, OB_TMP_BUF_SIZE_256, tz_info)) { LOG_WARN("extract rowkey failed", K(rowkey)); } else { ObString index_name = "PRIMARY"; if (relative_table.is_index_table()) { relative_table.get_index_name(index_name); } LOG_USER_ERROR(OB_ERR_PRIMARY_KEY_DUPLICATE, buffer, index_name.length(), index_name.ptr()); } LOG_WARN("rowkey already exists", K(ret), K(new_tbl_row)); } else { ObStoreRow new_row; new_row.flag_.set_flag(rowkey_change ? ObDmlFlag::DF_INSERT : ObDmlFlag::DF_UPDATE); new_row.row_val_ = new_tbl_row.row_val_; if (is_update_total_quantity_log && !rowkey_change) { ObStoreRow old_row; old_row.flag_.set_flag(ObDmlFlag::DF_UPDATE); old_row.row_val_ = old_tbl_row.row_val_; if (OB_FAIL(data_tablet.get_obj()->update_row(relative_table, ctx, col_descs, update_idx, old_row, new_row, run_ctx.dml_param_.encrypt_meta_))) { if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) { LOG_WARN("failed to update to row", K(ret), K(old_row), K(new_row)); } } } else { if (OB_FAIL(data_tablet.get_obj()->insert_row_without_rowkey_check(relative_table, ctx, col_descs, new_row, run_ctx.dml_param_.encrypt_meta_))) { if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) { LOG_WARN("failed to update to row", K(ret), K(new_row)); } } } } } return ret; } int ObLSTabletService::check_new_row_nullable_value( const ObIArray &column_ids, ObRelativeTable &data_table, const ObNewRow &new_row) { int ret = OB_SUCCESS; if (OB_UNLIKELY(column_ids.count() != new_row.get_count())) { ret = OB_ERR_UNEXPECTED; LOG_WARN("new row is invalid", K(ret), K(new_row.get_count()), K(column_ids.count())); } for (int64_t i = 0; OB_SUCC(ret) && i < column_ids.count(); ++i) { uint64_t column_id = column_ids.at(i); bool is_nullable = false; if (OB_UNLIKELY(is_shadow_column(column_id))) { //the shadow pk is generated internally, //and the nullable attribute check for it is skipped } else if (OB_FAIL(data_table.is_column_nullable_for_write(column_id, is_nullable))) { LOG_WARN("check is_column_nullable_for_write failed", K(ret), K(column_id)); } else if (new_row.get_cell(i).is_null() && !is_nullable) { bool is_hidden = false; bool is_gen_col = false; bool is_nullable_for_read = false; if (OB_FAIL(data_table.is_column_nullable_for_read(column_id, is_nullable_for_read))) { LOG_WARN("check is nullable for read failed", K(ret)); } else if (is_nullable_for_read) { LOG_TRACE("Catch a defensive nullable error, but this column is not null novalidate", K(column_id), K(column_ids), K(new_row), K(data_table)); } else if (OB_FAIL(data_table.is_hidden_column(column_id, is_hidden))) { LOG_WARN("get is hidden column failed", K(ret), K(column_id)); } else if (OB_FAIL(data_table.is_gen_column(column_id, is_gen_col))) { LOG_WARN("get is gen column failed", K(ret), K(column_id)); } else if (is_hidden && !is_gen_col) { ret = OB_BAD_NULL_ERROR; LOG_WARN("Catch a defensive nullable error, " "maybe cause by add column not null default null ONLINE", K(ret), K(column_id), K(column_ids), K(new_row), K(data_table)); } else { ret = OB_ERR_DEFENSIVE_CHECK; ObString func_name = ObString::make_string("check_new_row_nullable_value"); LOG_USER_ERROR(OB_ERR_DEFENSIVE_CHECK, func_name.length(), func_name.ptr()); LOG_DBA_ERROR(OB_ERR_DEFENSIVE_CHECK, "msg", "Fatal Error!!! Catch a defensive error!", K(ret), K(column_id), K(column_ids), K(new_row), K(data_table)); } } else if (new_row.get_cell(i).is_number()) { number::ObNumber num; if (OB_FAIL(new_row.get_cell(i).get_number(num))) { LOG_WARN("get number value from object fail", K(ret), K(new_row.get_cell(i))); } else if (OB_FAIL(num.sanity_check())) { LOG_WARN("sanity check number failed", K(ret), K(new_row.get_cell(i))); } if (OB_SUCCESS != ret) { ret = OB_ERR_DEFENSIVE_CHECK; ObString func_name = ObString::make_string("check_new_row_nullable_value"); LOG_USER_ERROR(OB_ERR_DEFENSIVE_CHECK, func_name.length(), func_name.ptr()); LOG_DBA_ERROR(OB_ERR_DEFENSIVE_CHECK, "msg", "Fatal Error!!! Catch a defensive error!", K(ret), K(column_id), K(column_ids), K(new_row), K(data_table)); } } } return ret; } int ObLSTabletService::check_new_row_nullable_value(const ObIArray &col_descs, ObRelativeTable &relative_table, const ObNewRow &new_row) { int ret = OB_SUCCESS; if (OB_UNLIKELY(col_descs.count() > new_row.get_count())) { ret = OB_ERR_UNEXPECTED; LOG_WARN("new row is invalid", K(ret), K(new_row.get_count()), K(col_descs.count())); } for (int64_t i = 0; OB_SUCC(ret) && i < col_descs.count(); ++i) { uint64_t column_id = col_descs.at(i).col_id_; bool is_nullable = false; if (OB_UNLIKELY(is_shadow_column(column_id))) { //the shadow pk is generated internally, //and the nullable attribute check for it is skipped } else if (OB_FAIL(relative_table.is_column_nullable_for_write(column_id, is_nullable))) { LOG_WARN("check is_column_nullable_for_write failed", K(ret), K(column_id)); } else if (new_row.get_cell(i).is_null() && !is_nullable) { bool is_hidden = false; bool is_gen_col = false; bool is_nullable_for_read = false; if (OB_FAIL(relative_table.is_column_nullable_for_read(column_id, is_nullable_for_read))) { LOG_WARN("check is nullable for read failed", K(ret)); } else if (is_nullable_for_read) { //this column is not null novalidate, maybe the null column come from the old data //so output trace log and ignore it LOG_TRACE("Catch a defensive nullable error, but this column is not null novalidate", K(column_id), K(col_descs), K(new_row), K(relative_table)); } else if (OB_FAIL(relative_table.is_hidden_column(column_id, is_hidden))) { LOG_WARN("get is hidden column failed", K(ret), K(column_id)); } else if (OB_FAIL(relative_table.is_gen_column(column_id, is_gen_col))) { LOG_WARN("get is gen column failed", K(ret), K(column_id)); } else if (is_hidden && !is_gen_col) { ret = OB_BAD_NULL_ERROR; LOG_WARN("Catch a defensive nullable error, " "maybe cause by add column not null default null ONLINE", K(ret), K(column_id), K(col_descs), K(new_row), K(relative_table)); } else { ret = OB_ERR_DEFENSIVE_CHECK; ObString func_name = ObString::make_string("check_new_row_nullable_value"); LOG_USER_ERROR(OB_ERR_DEFENSIVE_CHECK, func_name.length(), func_name.ptr()); LOG_DBA_ERROR(OB_ERR_DEFENSIVE_CHECK, "msg", "Fatal Error!!! Catch a defensive error!", K(ret), K(column_id), K(col_descs), K(new_row), K(relative_table)); } } else if (new_row.get_cell(i).is_number()) { number::ObNumber num; if (OB_FAIL(new_row.get_cell(i).get_number(num))) { LOG_WARN("get number value from object fail", K(ret), K(new_row.get_cell(i))); } else if (OB_FAIL(num.sanity_check())) { LOG_WARN("sanity check number failed", K(ret), K(new_row.get_cell(i))); } if (OB_SUCCESS != ret) { ret = OB_ERR_DEFENSIVE_CHECK; ObString func_name = ObString::make_string("check_new_row_nullable_value"); LOG_USER_ERROR(OB_ERR_DEFENSIVE_CHECK, func_name.length(), func_name.ptr()); LOG_DBA_ERROR(OB_ERR_DEFENSIVE_CHECK, "msg", "Fatal Error!!! Catch a defensive error!", K(ret), K(column_id), K(col_descs), K(new_row), K(relative_table)); } } } return ret; } int ObLSTabletService::check_new_row_shadow_pk( const ObIArray &column_ids, ObRelativeTable &data_table, const ObNewRow &new_row) { int ret = OB_SUCCESS; if (data_table.get_shadow_rowkey_column_num() > 0) { //check shadow pk int64_t rowkey_cnt = data_table.get_rowkey_column_num(); int64_t spk_cnt = data_table.get_shadow_rowkey_column_num(); int64_t index_col_cnt = rowkey_cnt - spk_cnt; bool need_spk = false; if (OB_UNLIKELY(index_col_cnt <= 0) || OB_UNLIKELY(column_ids.count() < rowkey_cnt)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("index column count is invalid", K(ret), K(index_col_cnt), K(rowkey_cnt), K(spk_cnt), K(column_ids.count())); } else if (lib::is_mysql_mode()) { // mysql兼容:只要unique index key中有null列,则需要填充shadow列 bool rowkey_has_null = false; for (int64_t i = 0; !rowkey_has_null && i < index_col_cnt; i++) { rowkey_has_null = new_row.get_cell(i).is_null(); } need_spk = rowkey_has_null; } else { // oracle兼容:只有unique index key全为null列时,才需要填充shadow列 bool is_rowkey_all_null = true; for (int64_t i = 0; is_rowkey_all_null && i < index_col_cnt; i++) { is_rowkey_all_null = new_row.get_cell(i).is_null(); } need_spk = is_rowkey_all_null; } for (int64_t i = index_col_cnt; OB_SUCC(ret) && i < rowkey_cnt; ++i) { uint64_t spk_column_id = column_ids.at(i); uint64_t real_pk_id = spk_column_id - OB_MIN_SHADOW_COLUMN_ID; const ObObj &spk_value = new_row.get_cell(i); int64_t pk_idx = OB_INVALID_INDEX; int cmp = 0; if (OB_LIKELY(!need_spk)) { if (!spk_value.is_null()) { ret = OB_ERR_DEFENSIVE_CHECK; ObString func_name = ObString::make_string("check_new_row_shadow_pk"); LOG_USER_ERROR(OB_ERR_DEFENSIVE_CHECK, func_name.length(), func_name.ptr()); LOG_ERROR("Fatal Error!!! Catch a defensive error!", K(ret), "column_id", column_ids, K(new_row), K(data_table), K(spk_value), K(i), K(spk_column_id), K(real_pk_id)); } } else if (OB_UNLIKELY(!has_exist_in_array(column_ids, real_pk_id, &pk_idx))) { ret = OB_ERR_UNEXPECTED; LOG_WARN("real pk column not exists in column_ids", K(ret), K(column_ids), K(real_pk_id)); } else if (OB_FAIL(new_row.get_cell(pk_idx).compare(spk_value, cmp)) || 0 != cmp) { ret = OB_ERR_DEFENSIVE_CHECK; ObString func_name = ObString::make_string("check_new_row_shadow_pk"); LOG_USER_ERROR(OB_ERR_DEFENSIVE_CHECK, func_name.length(), func_name.ptr()); LOG_DBA_ERROR(OB_ERR_DEFENSIVE_CHECK, "msg", "Fatal Error!!! Catch a defensive error!", K(ret), "column_id", column_ids, K(new_row), K(data_table), K(spk_value), "pk_value", new_row.get_cell(pk_idx), K(pk_idx), K(i), K(spk_column_id), K(real_pk_id)); } } } return ret; } int ObLSTabletService::check_row_locked_by_myself( ObTabletHandle &tablet_handle, ObRelativeTable &relative_table, ObStoreCtx &store_ctx, const ObDatumRowkey &rowkey, bool &locked) { int ret = OB_SUCCESS; ObTablet *tablet = tablet_handle.get_obj(); if (OB_UNLIKELY(nullptr == tablet || !relative_table.is_valid() || !store_ctx.is_valid() || !rowkey.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(tablet_handle), K(relative_table), K(store_ctx), K(rowkey)); } else { ObStorageTableGuard guard(tablet, store_ctx, true); if (OB_FAIL(guard.refresh_and_protect_table(relative_table))) { LOG_WARN("fail to protect table", K(ret), K(tablet_handle)); } else if (OB_FAIL(tablet->check_row_locked_by_myself(relative_table, store_ctx, rowkey, locked))) { LOG_WARN("fail to check row locked, ", K(ret), K(rowkey)); } } return ret; } int ObLSTabletService::get_conflict_rows( ObTabletHandle &tablet_handle, ObDMLRunningCtx &run_ctx, const ObInsertFlag flag, const common::ObIArray &out_col_ids, const common::ObNewRow &row, common::ObNewRowIterator *&duplicated_rows) { TRANS_LOG(DEBUG, "get conflict rows", K(flag), K(row), K(lbt())); int ret = OB_SUCCESS; ObRelativeTable &data_table = run_ctx.relative_table_; ObArenaAllocator scan_allocator(common::ObMemAttr(MTL_ID(), ObModIds::OB_TABLE_SCAN_ITER)); ObIAllocator *allocator = &scan_allocator; ObTablet *data_tablet = tablet_handle.get_obj(); ObDatumRowkeyHelper rowkey_helper(scan_allocator); ObDatumRowkey datum_rowkey; ObStoreRowkey rowkey; rowkey.assign(row.cells_, data_table.get_rowkey_column_num()); if (OB_ISNULL(data_tablet)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("tablet is null", K(ret), K(tablet_handle)); } else { ObSingleRowGetter single_row_getter(*allocator, *data_tablet); if (OB_FAIL(init_single_row_getter(single_row_getter, run_ctx, out_col_ids, data_table, true))) { LOG_WARN("failed to init single row getter", K(ret)); } else if (OB_FAIL(rowkey_helper.convert_datum_rowkey(rowkey.get_rowkey(), datum_rowkey))) { STORAGE_LOG(WARN, "Failed to transfer datum rowkey", K(ret), K(rowkey)); } else if (OB_FAIL(single_get_row(single_row_getter, datum_rowkey, duplicated_rows))) { LOG_WARN("failed to single get row", K(ret)); } } if (OB_FAIL(ret)) { if (nullptr != duplicated_rows) { ObQueryIteratorFactory::free_insert_dup_iter(duplicated_rows); duplicated_rows = nullptr; } } return ret; } int ObLSTabletService::init_single_row_getter( ObSingleRowGetter &row_getter, ObDMLRunningCtx &run_ctx, const ObIArray &out_col_ids, ObRelativeTable &relative_table, bool skip_read_lob) { int ret = OB_SUCCESS; if (OB_FAIL(row_getter.init_dml_access_ctx(run_ctx.store_ctx_, run_ctx.dml_param_, skip_read_lob))) { LOG_WARN("init dml access ctx failed", K(ret)); } else if (OB_FAIL(row_getter.init_dml_access_param(relative_table, run_ctx.dml_param_, out_col_ids, skip_read_lob))) { LOG_WARN("init dml access param failed", K(ret)); } return ret; } int ObLSTabletService::single_get_row( ObSingleRowGetter &row_getter, const ObDatumRowkey &rowkey, ObNewRowIterator *&duplicated_rows) { int ret = OB_SUCCESS; ObNewRow *row = nullptr; if (OB_FAIL(row_getter.open(rowkey))) { LOG_WARN("init single row getter failed", K(ret)); } else if (OB_FAIL(row_getter.get_next_row(row))) { if (OB_ITER_END != ret) { LOG_WARN("get next row from single row getter failed", K(ret)); } else { ret = OB_SUCCESS; } } else if (NULL == duplicated_rows) { ObValueRowIterator *dup_iter = NULL; if (OB_ISNULL(dup_iter = ObQueryIteratorFactory::get_insert_dup_iter())) { ret = OB_ALLOCATE_MEMORY_FAILED; LOG_WARN("no memory to alloc ObValueRowIterator", K(ret)); } else { duplicated_rows = dup_iter; if (OB_FAIL(dup_iter->init(true))) { LOG_WARN("failed to initialize ObValueRowIterator", K(ret)); } } } if (OB_SUCC(ret) && row != nullptr) { ObValueRowIterator *dup_iter = static_cast(duplicated_rows); if (OB_FAIL(dup_iter->add_row(*row))) { LOG_WARN("failed to store conflict row", K(ret), K(*row)); } else { LOG_DEBUG("get conflict row", KPC(row)); } } return ret; } int ObLSTabletService::convert_row_to_rowkey( ObSingleRowGetter &index_row_getter, ObStoreRowkey &rowkey) { int ret = OB_SUCCESS; ObNewRow *row = nullptr; if (OB_FAIL(index_row_getter.get_next_row(row))) { if (OB_ITER_END != ret) { LOG_WARN("get next row from index row getter failed", K(ret)); } } else { rowkey.assign(row->cells_, row->count_); } return ret; } /* this func is an encapsulation of ObNewRowIterator->get_next_row. * 1. need_copy_cells is true, perform a cells copy, but not a deep copy. * memory for store_row.row_val.cells_ has already allocated before * this func is invoked, no need to alloc memory in this func. * 2. need_copy_cells is false, just perform an assignment, no any copy behavior, */ int ObLSTabletService::get_next_row_from_iter( ObNewRowIterator *row_iter, ObStoreRow &store_row, const bool need_copy_cells) { int ret = OB_SUCCESS; ObNewRow *row = nullptr; if (OB_ISNULL(row_iter)) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid argument", K(ret), K(row_iter)); } else if (OB_FAIL(row_iter->get_next_row(row))) { if (OB_ITER_END != ret) { LOG_WARN("fail to iterate a row", K(ret), K(row)); } } else { if (need_copy_cells) { // in this situation, store_row.row_val has already hold mem for cells_, // no need to alloc mem here, we copy cells only. store_row.row_val_.count_ = row->count_; for (int64_t i = 0; i < row->count_; ++i) { store_row.row_val_.cells_[i] = row->cells_[i]; } } else { store_row.row_val_ = *row; } } return ret; } int ObLSTabletService::insert_row_to_tablet( ObTabletHandle &tablet_handle, ObDMLRunningCtx &run_ctx, ObStoreRow &tbl_row) { int ret = OB_SUCCESS; ObStoreCtx &store_ctx = run_ctx.store_ctx_; ObRelativeTable &relative_table = run_ctx.relative_table_; if (OB_UNLIKELY(!store_ctx.is_valid() || !relative_table.is_valid() || nullptr == run_ctx.col_descs_ || run_ctx.col_descs_->count() <= 0 || !tbl_row.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(store_ctx), KP(run_ctx.col_descs_), K(tbl_row), K(ret)); } else if (GCONF.enable_defensive_check() && OB_FAIL(check_new_row_legitimacy(run_ctx, tbl_row.row_val_))) { LOG_WARN("check new row legitimacy failed", K(ret), K(tbl_row.row_val_)); } else if (OB_FAIL(insert_lob_tablet_row(tablet_handle, run_ctx, tbl_row))) { LOG_WARN("failed to write lob tablets rows", K(ret)); } else { const ObColDescIArray &col_descs = *run_ctx.col_descs_; if (OB_FAIL(tablet_handle.get_obj()->insert_row_without_rowkey_check( relative_table, store_ctx, col_descs, tbl_row, run_ctx.dml_param_.encrypt_meta_))) { if (OB_TRY_LOCK_ROW_CONFLICT != ret) { LOG_WARN("failed to write table row", K(ret), "table id", relative_table.get_table_id(), K(col_descs), K(tbl_row)); } } } return ret; } int ObLSTabletService::process_old_row_lob_col( ObTabletHandle &data_tablet_handle, ObDMLRunningCtx &run_ctx, ObStoreRow &tbl_row) { int ret = OB_SUCCESS; run_ctx.is_old_row_valid_for_lob_ = false; bool has_lob_col = false; bool need_reread = is_sys_table(run_ctx.relative_table_.get_table_id()); int64_t col_cnt = run_ctx.col_descs_->count(); if (tbl_row.row_val_.count_ != col_cnt) { ret = OB_ERR_UNEXPECTED; LOG_WARN("[STORAGE_LOB]Invliad row col cnt", K(ret), K(col_cnt), K(tbl_row)); } else { for (int64_t i = 0; OB_SUCC(ret) && i < col_cnt; ++i) { const ObColDesc &column = run_ctx.col_descs_->at(i); if (is_lob_storage(column.col_type_.get_type())) { has_lob_col = true; need_reread = need_reread || !(tbl_row.row_val_.cells_[i].has_lob_header()); break; } } } if (OB_SUCC(ret) && has_lob_col) { if (!need_reread) { for (int64_t i = 0; OB_SUCC(ret) && i < col_cnt; ++i) { const ObColDesc &column = run_ctx.col_descs_->at(i); if (is_lob_storage(column.col_type_.get_type())) { ObObj &obj = tbl_row.row_val_.cells_[i]; bool has_lob_header = obj.has_lob_header(); if (obj.is_null() || obj.is_nop_value()) { // do nothing } else if (!has_lob_header) { ret = OB_ERR_UNEXPECTED; LOG_WARN("lob should have lob locator here.", K(ret), K(i), K(tbl_row.row_val_.cells_[i])); } else { ObLobLocatorV2 lob(obj.get_string(), has_lob_header); ObString disk_loc; if (!lob.is_valid()) { ret = OB_ERR_UNEXPECTED; LOG_WARN("invalid lob locator.", K(ret), K(lob)); } else if (lob.is_simple()) { // do nothing } else if (OB_FAIL(lob.get_disk_locator(disk_loc))) { LOG_WARN("failed to get disk lob locator.", K(ret), K(lob)); } else { obj.set_lob_value(obj.get_type(), disk_loc.ptr(), disk_loc.length()); if (has_lob_header) { obj.set_has_lob_header(); } run_ctx.is_old_row_valid_for_lob_ = true; } } } } } else { if (OB_FAIL(table_refresh_row(data_tablet_handle, run_ctx, tbl_row.row_val_))) { LOG_WARN("[STORAGE_LOB]re-read lob col failed", K(ret)); } } } return ret; } int ObLSTabletService::table_refresh_row( ObTabletHandle &data_tablet_handle, ObDMLRunningCtx &run_ctx, ObNewRow &row) { int ret = OB_SUCCESS; ObArenaAllocator scan_allocator(common::ObMemAttr(MTL_ID(), ObModIds::OB_LOB_ACCESS_BUFFER)); ObTablet *data_tablet = data_tablet_handle.get_obj(); ObRelativeTable &data_table = run_ctx.relative_table_; ObStoreRowkey rowkey; if (OB_FAIL(rowkey.assign(row.cells_, data_table.get_rowkey_column_num()))) { LOG_WARN("get rowkey col num failed", K(ret)); } int64_t col_cnt = run_ctx.col_descs_->count(); ObSEArray out_col_ids; for (int i = 0; OB_SUCC(ret) && i < col_cnt; ++i) { if (OB_FAIL(out_col_ids.push_back(run_ctx.col_descs_->at(i).col_id_))) { LOG_WARN("push col id failed.", K(ret), K(i)); } } ObDatumRowkey datum_rowkey; ObDatumRowkeyHelper rowkey_helper(scan_allocator); ObSingleRowGetter single_row_getter(scan_allocator, *data_tablet); if (OB_FAIL(ret)) { } else if (OB_FAIL(init_single_row_getter(single_row_getter, run_ctx, out_col_ids, data_table, true))) { LOG_WARN("failed to init single row getter", K(ret)); } else if (OB_FAIL(rowkey_helper.convert_datum_rowkey(rowkey.get_rowkey(), datum_rowkey))) { LOG_WARN("Failed to transfer datum rowkey", K(ret), K(rowkey)); } else { ObNewRow *new_row = nullptr; if (OB_FAIL(single_row_getter.open(datum_rowkey))) { LOG_WARN("init single row getter failed", K(ret)); } else if (OB_FAIL(single_row_getter.get_next_row(new_row))) { if (ret == OB_ITER_END) { LOG_DEBUG("re-read old row not exist", K(ret), K(row)); ret = OB_SUCCESS; } else { LOG_WARN("get next row from single row getter failed", K(ret)); } } else if (OB_ISNULL(new_row)) { ret = OB_ERR_NULL_VALUE; LOG_WARN("get next row from single row null", K(ret)); } else if (new_row->get_count() != row.get_count()) { ret = OB_ERR_UNEXPECTED; LOG_WARN("get row from single row col count not equal.", K(ret), K(row.get_count()), K(new_row->get_count())); } else { LOG_DEBUG("get new row success.", K(row), KPC(new_row)); // only write cells, not write row // passing fixed double scale from row to new_row for (int64_t i = 0; OB_SUCC(ret) && i < new_row->get_count(); ++i) { if (row.cells_[i].is_fixed_double()) { new_row->cells_[i].set_scale(row.cells_[i].get_scale()); } else if (OB_FAIL(ob_write_obj(run_ctx.lob_allocator_, new_row->cells_[i], row.cells_[i]))) { LOG_WARN("copy ObObj error", K(ret), K(i), K(new_row->cells_[i])); } } if (OB_SUCC(ret)) { run_ctx.is_old_row_valid_for_lob_ = true; } } } return ret; } int ObLSTabletService::delete_row_in_tablet( ObTabletHandle &tablet_handle, ObDMLRunningCtx &run_ctx, const ObNewRow &row) { int ret = OB_SUCCESS; const ObDMLBaseParam &dml_param = run_ctx.dml_param_; ObStoreCtx &ctx = run_ctx.store_ctx_; ObRelativeTable &relative_table = run_ctx.relative_table_; ObStoreRow &tbl_row = run_ctx.tbl_row_; ObStoreRow new_tbl_row; ObSEArray update_idx; // update_idx is a dummy param here tbl_row.flag_.set_flag(ObDmlFlag::DF_DELETE); tbl_row.row_val_ = row; if (OB_FAIL(check_old_row_legitimacy(tablet_handle, run_ctx, row))) { if (OB_ERR_DEFENSIVE_CHECK == ret) { dump_diag_info_for_old_row_loss(relative_table, ctx, tbl_row); } LOG_WARN("check old row legitimacy failed", K(row)); } else if (OB_FAIL(process_old_row_lob_col(tablet_handle, run_ctx, tbl_row))) { LOG_WARN("failed to process old row lob col", K(ret), K(tbl_row)); } else if (OB_FAIL(delete_lob_tablet_rows(run_ctx, tablet_handle, tbl_row, row))) { LOG_WARN("failed to delete lob rows.", K(ret), K(tbl_row), K(row)); } else if (!dml_param.is_total_quantity_log_) { if (OB_FAIL(tablet_handle.get_obj()->insert_row_without_rowkey_check(relative_table, ctx, *run_ctx.col_descs_, tbl_row, dml_param.encrypt_meta_))) { if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) { LOG_WARN("failed to set row", K(ret), K(*run_ctx.col_descs_), K(tbl_row)); } } } else { update_idx.reset(); // update_idx is a dummy param here new_tbl_row.reset(); new_tbl_row.flag_.set_flag(ObDmlFlag::DF_DELETE); new_tbl_row.row_val_ = tbl_row.row_val_; tbl_row.flag_.set_flag(ObDmlFlag::DF_UPDATE); if (OB_FAIL(tablet_handle.get_obj()->update_row(relative_table, ctx, *run_ctx.col_descs_, update_idx, tbl_row, new_tbl_row, dml_param.encrypt_meta_))) { if (OB_TRY_LOCK_ROW_CONFLICT != ret && OB_TRANSACTION_SET_VIOLATION != ret) { LOG_WARN("failed to set row", K(ret), K(*run_ctx.col_descs_), K(tbl_row), K(new_tbl_row)); } } else { LOG_DEBUG("succeeded to del main table row", K(tbl_row), K(new_tbl_row)); } } return ret; } int ObLSTabletService::delete_lob_col( ObDMLRunningCtx &run_ctx, const ObColDesc &column, ObObj &obj, const ObObj &sql_obj, ObLobCommon *&lob_common, ObLobAccessParam &lob_param) { int ret = OB_SUCCESS; ObLobManager *lob_mngr = MTL(ObLobManager*); if (OB_ISNULL(lob_mngr)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("[STORAGE_LOB]get lob manager instance failed.", K(ret)); } else if (!column.col_type_.is_lob_storage() || obj.is_nop_value() || obj.is_null() || !run_ctx.is_old_row_valid_for_lob_) { // do nothing } else { ObString data = obj.get_string(); // Notice: Only disk locator here! ObString sql_data = sql_obj.get_string(); if (data.length() < sizeof(ObLobCommon)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("[STORAGE_LOB]Invalid Lob data.", K(ret), K(obj), K(data)); } else { void *buf = run_ctx.lob_allocator_.alloc(data.length()); if (OB_ISNULL(buf)) { ret = OB_ALLOCATE_MEMORY_FAILED; LOG_WARN("failed to deep copy lob data.", K(ret), K(data)); } else { MEMCPY(buf, data.ptr(), data.length()); lob_common = reinterpret_cast(buf); lob_param.tx_desc_ = run_ctx.store_ctx_.mvcc_acc_ctx_.tx_desc_; lob_param.parent_seq_no_ = run_ctx.store_ctx_.mvcc_acc_ctx_.tx_scn_; lob_param.snapshot_ = run_ctx.dml_param_.snapshot_; lob_param.tx_id_ = lob_param.tx_desc_->get_tx_id(); lob_param.sql_mode_ = run_ctx.dml_param_.sql_mode_; lob_param.is_total_quantity_log_ = run_ctx.dml_param_.is_total_quantity_log_; lob_param.ls_id_ = run_ctx.store_ctx_.ls_id_; lob_param.tablet_id_ = run_ctx.relative_table_.get_tablet_id(); lob_param.coll_type_ = column.col_type_.get_collation_type(); lob_param.allocator_ = &run_ctx.lob_allocator_; lob_param.lob_common_ = lob_common; lob_param.handle_size_ = data.length(); lob_param.byte_size_ = lob_param.lob_common_->get_byte_size(data.length()); lob_param.timeout_ = run_ctx.dml_param_.timeout_; lob_param.scan_backward_ = false; lob_param.offset_ = 0; // use byte size to delete all lob_param.len_ = lob_param.byte_size_; //ObCharset::strlen_char(lob_param.coll_type_, sql_data.ptr(), sql_data.length()); if (lob_param.byte_size_ < 0) { ret = OB_ERR_UNEXPECTED; LOG_WARN("calc byte size is negative.", K(ret), K(data), K(lob_param)); } else if (OB_FAIL(lob_mngr->erase(lob_param))) { LOG_WARN("[STORAGE_LOB]lob erase failed.", K(ret), K(lob_param)); } } } } return ret; } int ObLSTabletService::delete_lob_tablet_rows( ObDMLRunningCtx &run_ctx, ObTabletHandle &data_tablet, ObStoreRow &tbl_row, const ObNewRow &row) { int ret = OB_SUCCESS; int64_t col_cnt = run_ctx.col_descs_->count(); if (tbl_row.row_val_.count_ != col_cnt) { ret = OB_ERR_UNEXPECTED; LOG_WARN("[STORAGE_LOB]Invliad row col cnt", K(col_cnt), K(tbl_row)); } else { ObLobCommon *lob_common = nullptr; for (int64_t i = 0; OB_SUCC(ret) && i < col_cnt; ++i) { const ObColDesc &column = run_ctx.col_descs_->at(i); if (column.col_type_.is_lob_storage()) { ObObj &obj = tbl_row.row_val_.get_cell(i); const ObObj &sql_obj = row.get_cell(i); ObLobAccessParam lob_param; if (OB_FAIL(delete_lob_col(run_ctx, column, obj, sql_obj, lob_common, lob_param))) { LOG_WARN("[STORAGE_LOB]failed to erase lob col.", K(ret), K(i), K(tbl_row)); } } } } return ret; } int ObLSTabletService::prepare_scan_table_param( ObTableScanParam ¶m, share::schema::ObMultiVersionSchemaService &schema_service) { int ret = OB_SUCCESS; if (NULL == param.table_param_ || OB_INVALID_ID == param.table_param_->get_table_id()) { void *buf = NULL; ObTableParam *table_param = NULL; ObSchemaGetterGuard schema_guard; const ObTableSchema *table_schema = NULL; const uint64_t tenant_id = MTL_ID(); const bool check_formal = param.index_id_ > OB_MAX_CORE_TABLE_ID; if (OB_FAIL(schema_service.get_tenant_schema_guard(tenant_id, schema_guard))) { LOG_WARN("failed to get schema manager", K(ret), K(tenant_id)); } else if (check_formal && OB_FAIL(schema_guard.check_formal_guard())) { LOG_WARN("Fail to check formal schema, ", K(param.index_id_), K(ret)); } else if (OB_FAIL(schema_guard.get_table_schema(tenant_id, param.index_id_, table_schema))) { LOG_WARN("Fail to get table schema", K(param.index_id_), K(ret)); } else if (NULL == table_schema) { ret = OB_TABLE_NOT_EXIST; LOG_WARN("table not exist", K(param.index_id_), K(ret)); } else { if (NULL == (buf = param.allocator_->alloc(sizeof(ObTableParam)))) { ret = OB_ALLOCATE_MEMORY_FAILED; LOG_WARN("Fail to allocate memory, ", K(ret)); } else { //TODO table param should not generate twice!!!! table_param = new (buf) ObTableParam(*param.allocator_); table_param->get_enable_lob_locator_v2() = (!IS_CLUSTER_VERSION_BEFORE_4_1_0_0); if (OB_FAIL(table_param->convert(*table_schema, param.column_ids_, param.pd_storage_flag_))) { LOG_WARN("Fail to convert table param, ", K(ret)); } else { param.table_param_ = table_param; } } } } return ret; } void ObLSTabletService::dump_diag_info_for_old_row_loss( ObRelativeTable &data_table, ObStoreCtx &store_ctx, const ObStoreRow &tbl_row) { int ret = OB_SUCCESS; ObArenaAllocator allocator(common::ObMemAttr(MTL_ID(), "DumpDIAGInfo")); ObTableAccessParam access_param; ObTableAccessContext access_ctx; ObSEArray out_col_pros; ObStoreRowkey rowkey; ObDatumRowkey datum_rowkey; ObDatumRowkeyHelper rowkey_helper(allocator); const int64_t schema_rowkey_cnt = data_table.get_rowkey_column_num(); ObTableStoreIterator &table_iter = *data_table.tablet_iter_.table_iter(); ObQueryFlag query_flag(ObQueryFlag::Forward, false, /*is daily merge scan*/ false, /*is read multiple macro block*/ false, /*sys task scan, read one macro block in single io*/ false /*is full row scan?*/, false, false); common::ObVersionRange trans_version_rang; trans_version_rang.base_version_ = 0; trans_version_rang.multi_version_start_ = 0; trans_version_rang.snapshot_version_ = store_ctx.mvcc_acc_ctx_.get_snapshot_version().get_val_for_tx(); const share::schema::ObTableSchemaParam *schema_param = data_table.get_schema_param(); const ObITableReadInfo *read_info = &schema_param->get_read_info(); for (int64_t i = 0; OB_SUCC(ret) && i < read_info->get_request_count(); i++) { if (OB_FAIL(out_col_pros.push_back(i))) { STORAGE_LOG(WARN, "Failed to push back col project", K(ret), K(i)); } } if (OB_FAIL(ret)) { } else if (OB_FAIL(rowkey.assign(tbl_row.row_val_.cells_, schema_rowkey_cnt))) { LOG_WARN("Failed to assign rowkey", K(ret)); } else if (OB_FAIL(rowkey_helper.convert_datum_rowkey(rowkey.get_rowkey(), datum_rowkey))) { STORAGE_LOG(WARN, "Failed to transfer datum rowkey", K(ret), K(rowkey)); } else if (OB_FAIL(access_ctx.init(query_flag, store_ctx, allocator, trans_version_rang))) { LOG_WARN("Fail to init access ctx", K(ret)); } else { access_param.is_inited_ = true; access_param.iter_param_.table_id_ = data_table.get_table_id(); access_param.iter_param_.tablet_id_ = data_table.tablet_iter_.get_tablet()->get_tablet_meta().tablet_id_; access_param.iter_param_.read_info_ = read_info; access_param.iter_param_.out_cols_project_ = &out_col_pros; ObStoreRowIterator *getter = nullptr; ObITable *table = nullptr; const ObDatumRow *row = nullptr; FLOG_INFO("Try to find the specified rowkey within all the sstable", K(tbl_row), K(table_iter)); FLOG_INFO("Prepare the diag env to dump the rows", K(store_ctx), K(rowkey), K(datum_rowkey), K(access_ctx.trans_version_range_)); table_iter.resume(); while (OB_SUCC(ret)) { if (OB_FAIL(table_iter.get_next(table))) { if (OB_ITER_END != ret) { LOG_WARN("failed to get next tables", K(ret)); } } else if (OB_ISNULL(table)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("table must not be null", K(ret), K(table_iter)); } else if (OB_FAIL(table->get(access_param.iter_param_, access_ctx, datum_rowkey, getter))) { LOG_WARN("Failed to get param", K(ret), KPC(table)); } else if (OB_FAIL(getter->get_next_row(row))) { LOG_WARN("Failed to get next row", K(ret), KPC(table)); } else if (row->row_flag_.is_not_exist() || row->row_flag_.is_delete()){ FLOG_INFO("Cannot found rowkey in the table", KPC(row), KPC(table)); } else if (table->is_sstable()) { FLOG_INFO("Found rowkey in the sstable", KPC(row), KPC(reinterpret_cast(table))); } else { FLOG_INFO("Found rowkey in the memtable", KPC(row), KPC(reinterpret_cast(table))); } // ignore error in the loop if (OB_FAIL(ret) && OB_ITER_END != ret) { ret = OB_SUCCESS; } if (OB_NOT_NULL(getter)) { getter->~ObStoreRowIterator(); getter = nullptr; } } if (OB_ITER_END == ret) { ret = OB_SUCCESS; } if (OB_SUCC(ret)) { FLOG_INFO("prepare to use single merge to find row", K(rowkey), K(datum_rowkey), K(access_param)); ObSingleMerge *get_merge = nullptr; ObGetTableParam get_table_param; ObDatumRow *row = nullptr; get_table_param.tablet_iter_ = data_table.tablet_iter_; void *buf = nullptr; if (OB_ISNULL(buf = allocator.alloc(sizeof(ObSingleMerge)))) { ret = OB_ALLOCATE_MEMORY_FAILED; LOG_WARN("Failed to alloc memory for single merge", K(ret)); } else if (FALSE_IT(get_merge = new(buf)ObSingleMerge())) { } else if (OB_FAIL(get_merge->init(access_param, access_ctx, get_table_param))) { LOG_WARN("Failed to init single get merge", K(ret)); } else if (OB_FAIL(get_merge->open(datum_rowkey))) { LOG_WARN("Failed to open single merge", K(ret)); } else if (FALSE_IT(get_merge->disable_fill_default())) { } else { while (OB_SUCC(get_merge->get_next_row(row))) { FLOG_INFO("Found one row for the rowkey", KPC(row)); } FLOG_INFO("Finish to find rowkey with single merge", K(ret), K(rowkey), K(datum_rowkey)); } if (OB_NOT_NULL(get_merge)) { get_merge->~ObSingleMerge(); get_merge = nullptr; } } #ifdef ENABLE_DEBUG_LOG // print single row check info if (store_ctx.mvcc_acc_ctx_.tx_id_.is_valid()) { transaction::ObTransService *trx = MTL(transaction::ObTransService *); if (OB_NOT_NULL(trx) && NULL != trx->get_defensive_check_mgr()) { (void)trx->get_defensive_check_mgr()->dump(store_ctx.mvcc_acc_ctx_.tx_id_); } } #endif } } int ObLSTabletService::prepare_dml_running_ctx( const common::ObIArray *column_ids, const common::ObIArray *upd_col_ids, ObTabletHandle &tablet_handle, ObDMLRunningCtx &run_ctx) { int ret = OB_SUCCESS; if (OB_FAIL(run_ctx.init( column_ids, upd_col_ids, MTL(ObTenantSchemaService*)->get_schema_service(), tablet_handle))) { LOG_WARN("failed to init run ctx", K(ret)); } return ret; } int ObLSTabletService::get_ls_min_end_scn( SCN &min_end_scn_from_latest_tablets, SCN &min_end_scn_from_old_tablets) { int ret = OB_SUCCESS; const ObLSID &ls_id = ls_->get_ls_id(); ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); ObSArray tablet_ids; GetAllTabletIDOperator op(tablet_ids, true/*except_ls_inner_tablet*/); min_end_scn_from_latest_tablets.set_max(); min_end_scn_from_old_tablets.set_max(); if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_FAIL(tablet_id_set_.foreach(op))) { STORAGE_LOG(WARN, "fail to get all tablet ids from set", K(ret)); } else { SCN ls_checkpoint = ls_->get_clog_checkpoint_scn(); for (int64_t i = 0; OB_SUCC(ret) && i < tablet_ids.count(); ++i) { ObTabletMapKey key(ls_id, tablet_ids.at(i)); SCN min_end_scn_from_latest = SCN::max_scn(); SCN min_end_scn_from_old = SCN::max_scn(); if (OB_FAIL(t3m->get_min_end_scn_for_ls(key, ls_checkpoint, min_end_scn_from_latest, min_end_scn_from_old))) { if (OB_ENTRY_NOT_EXIST != ret) { LOG_WARN("fail to get min end scn", K(ret), K(key)); } else { ret = OB_SUCCESS; } } else { if (min_end_scn_from_latest < min_end_scn_from_latest_tablets) { LOG_DEBUG("update", K(key), K(min_end_scn_from_latest_tablets), K(min_end_scn_from_latest)); min_end_scn_from_latest_tablets = min_end_scn_from_latest; } if (min_end_scn_from_old < min_end_scn_from_old_tablets) { LOG_DEBUG("update", K(key), K(min_end_scn_from_old_tablets), K(min_end_scn_from_old)); min_end_scn_from_old_tablets = min_end_scn_from_old; } } } LOG_INFO("get ls min end scn finish", K(ls_checkpoint)); } return ret; } int ObLSTabletService::get_multi_ranges_cost( const ObTabletID &tablet_id, const common::ObIArray &ranges, int64_t &total_size) { int ret = OB_SUCCESS; ObTabletTableIterator iter; const int64_t max_snapshot_version = INT64_MAX; if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret)); } else if (OB_FAIL(get_read_tables(tablet_id, max_snapshot_version, iter))) { LOG_WARN("fail to get all read tables", K(ret), K(tablet_id), K(max_snapshot_version)); } else { ObPartitionMultiRangeSpliter spliter; if (OB_FAIL(spliter.get_multi_range_size( ranges, iter.get_tablet()->get_rowkey_read_info(), *iter.table_iter(), total_size))) { LOG_WARN("fail to get multi ranges cost", K(ret), K(ranges)); } } return ret; } int ObLSTabletService::split_multi_ranges( const ObTabletID &tablet_id, const ObIArray &ranges, const int64_t expected_task_count, common::ObIAllocator &allocator, ObArrayArray &multi_range_split_array) { int ret = OB_SUCCESS; ObTabletTableIterator iter; const int64_t max_snapshot_version = INT64_MAX; if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret)); } else if (OB_FAIL(get_read_tables(tablet_id, max_snapshot_version, iter))) { LOG_WARN("fail to get all read tables", K(ret), K(tablet_id), K(max_snapshot_version)); } else { ObPartitionMultiRangeSpliter spliter; if (OB_FAIL(spliter.get_split_multi_ranges( ranges, expected_task_count, iter.get_tablet()->get_rowkey_read_info(), *iter.table_iter(), allocator, multi_range_split_array))) { LOG_WARN("fail to get splitted ranges", K(ret), K(ranges), K(expected_task_count)); } } return ret; } int ObLSTabletService::estimate_row_count( const ObTableScanParam ¶m, const ObTableScanRange &scan_range, ObIArray &est_records, int64_t &logical_row_count, int64_t &physical_row_count) { int ret = OB_SUCCESS; ObPartitionEst batch_est; ObTabletTableIterator tablet_iter; common::ObSEArray tables; if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!param.is_estimate_valid() || !scan_range.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid argument", K(ret), K(param), K(scan_range)); } else if (scan_range.is_empty()) { } else { const int64_t snapshot_version = -1 == param.frozen_version_ ? GET_BATCH_ROWS_READ_SNAPSHOT_VERSION : param.frozen_version_; if (OB_FAIL(get_read_tables(param.tablet_id_, snapshot_version, tablet_iter, false))) { if (OB_TABLET_NOT_EXIST != ret) { LOG_WARN("failed to get tablet_iter", K(ret), K(snapshot_version), K(param)); } } else { while(OB_SUCC(ret)) { ObITable *table = nullptr; if (OB_FAIL(tablet_iter.table_iter()->get_next(table))) { if (OB_ITER_END != ret) { LOG_WARN("failed to get next table", K(ret), K(tablet_iter.table_iter())); } else { ret = OB_SUCCESS; break; } } else if (OB_ISNULL(table)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("table shoud not be null", K(ret), K(tablet_iter.table_iter())); } else if (table->is_sstable() && static_cast(table)->is_empty()) { LOG_DEBUG("cur sstable is empty", K(ret), K(*table)); continue; } if (OB_SUCC(ret) && OB_FAIL(tables.push_back(table))) { LOG_WARN("failed to push back table", K(ret), K(tables)); } } } if (OB_SUCC(ret) && tables.count() > 0) { ObTableEstimateBaseInput base_input(param.scan_flag_, param.index_id_, param.tx_id_, tables, tablet_iter.get_tablet_handle()); if (scan_range.is_get()) { if (OB_FAIL(ObTableEstimator::estimate_row_count_for_get(base_input, scan_range.get_rowkeys(), batch_est))) { LOG_WARN("failed to estimate row count", K(ret), K(param), K(scan_range)); } } else if (OB_FAIL(ObTableEstimator::estimate_row_count_for_scan(base_input, scan_range.get_ranges(), batch_est, est_records))) { LOG_WARN("failed to estimate row count", K(ret), K(param), K(scan_range)); } } } if (OB_SUCC(ret)) { logical_row_count = batch_est.logical_row_count_; physical_row_count = batch_est.physical_row_count_; } LOG_DEBUG("estimate result", K(ret), K(batch_est), K(est_records)); return ret; } int ObLSTabletService::estimate_block_count_and_row_count( const common::ObTabletID &tablet_id, int64_t ¯o_block_count, int64_t µ_block_count, int64_t &sstable_row_count, int64_t &memtable_row_count, common::ObIArray &cg_macro_cnt_arr, common::ObIArray &cg_micro_cnt_arr) { int ret = OB_SUCCESS; macro_block_count = 0; micro_block_count = 0; sstable_row_count = 0; memtable_row_count = 0; ObTabletTableIterator tablet_iter; if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_FAIL(get_read_tables(tablet_id, INT64_MAX, tablet_iter, false/*allow_no_ready_read*/))) { LOG_WARN("failed to get read tables", K(ret)); } ObITable *table = nullptr; ObSSTable *sstable = nullptr; cg_macro_cnt_arr.reset(); cg_micro_cnt_arr.reset(); while (OB_SUCC(ret)) { ObSSTableMetaHandle sst_meta_hdl; if (OB_FAIL(tablet_iter.table_iter()->get_next(table))) { if (OB_ITER_END != ret) { LOG_WARN("failed to get next tables", K(ret)); } else { ret = OB_SUCCESS; break; } } else if (OB_ISNULL(table)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("get unexpected null table", K(ret), K(tablet_iter.table_iter())); } else if (table->is_memtable()) { memtable_row_count += static_cast(table)->get_physical_row_cnt(); } else if (table->is_sstable()) { sstable = static_cast(table); if (OB_FAIL(sstable->get_meta(sst_meta_hdl))) { LOG_WARN("fail to get sstable meta handle", K(ret)); } else { sstable = static_cast(table); macro_block_count += sstable->get_data_macro_block_count(); micro_block_count += sst_meta_hdl.get_sstable_meta().get_data_micro_block_count(); sstable_row_count += sst_meta_hdl.get_sstable_meta().get_row_count(); } } if (OB_SUCC(ret) && table->is_co_sstable()) { ObCOSSTableV2 *co_sstable = static_cast(table); common::ObArray tables; if (OB_FAIL(co_sstable->get_all_tables(tables))) { LOG_WARN("fail to get all tables", K(ret), KPC(co_sstable)); } else { for (int64_t i = 0; OB_SUCC(ret) && i < tables.count(); i++) { ObITable *cg_table = tables.at(i); ObSSTableMetaHandle co_sst_meta_hdl; if (OB_UNLIKELY(cg_table == nullptr || !cg_table->is_sstable())) { ret = OB_ERR_UNEXPECTED; LOG_WARN("unexpected cg table", K(ret), KPC(cg_table)); } else if (FALSE_IT(sstable = static_cast(cg_table))) { } else if (OB_FAIL(sstable->get_meta(co_sst_meta_hdl))) { LOG_WARN("fail to get sstable meta handle", K(ret)); } else if (OB_FAIL(cg_macro_cnt_arr.push_back(sstable->get_data_macro_block_count()))) { LOG_WARN("fail to push macro count", K(ret)); } else if (OB_FAIL(cg_micro_cnt_arr.push_back(co_sst_meta_hdl.get_sstable_meta().get_data_micro_block_count()))) { LOG_WARN("fail to push micro count", K(ret)); } } } } } return ret; } int ObLSTabletService::get_tx_data_memtable_mgr(ObMemtableMgrHandle &mgr_handle) { mgr_handle.reset(); return mgr_handle.set_memtable_mgr(&tx_data_memtable_mgr_); } int ObLSTabletService::get_tx_ctx_memtable_mgr(ObMemtableMgrHandle &mgr_handle) { mgr_handle.reset(); return mgr_handle.set_memtable_mgr(&tx_ctx_memtable_mgr_); } int ObLSTabletService::get_lock_memtable_mgr(ObMemtableMgrHandle &mgr_handle) { mgr_handle.reset(); return mgr_handle.set_memtable_mgr(&lock_memtable_mgr_); } int ObLSTabletService::get_mds_table_mgr(mds::MdsTableMgrHandle &mgr_handle) { mgr_handle.reset(); return mgr_handle.set_mds_table_mgr(&mds_table_mgr_); } int ObLSTabletService::create_ls_inner_tablet( const share::ObLSID &ls_id, const common::ObTabletID &tablet_id, const SCN &major_frozen_scn, const share::schema::ObTableSchema &table_schema, const lib::Worker::CompatMode &compat_mode, const SCN &create_scn) { int ret = OB_SUCCESS; bool b_exist = false; ObTabletHandle tablet_handle; common::ObTabletID empty_tablet_id; ObMetaDiskAddr disk_addr; const int64_t snapshot_version = major_frozen_scn.get_val_for_tx(); if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!ls_id.is_valid()) || OB_UNLIKELY(!tablet_id.is_valid()) || OB_UNLIKELY(!major_frozen_scn.is_valid()) || OB_UNLIKELY(!table_schema.is_valid()) || OB_UNLIKELY(lib::Worker::CompatMode::INVALID == compat_mode) || OB_UNLIKELY(!create_scn.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(ls_id), K(tablet_id), K(major_frozen_scn), K(table_schema), K(compat_mode), K(create_scn)); } else if (OB_UNLIKELY(ls_id != ls_->get_ls_id())) { ret = OB_ERR_UNEXPECTED; LOG_WARN("ls id is unexpected", K(ret), "arg_ls_id", ls_id, "ls_id", ls_->get_ls_id()); } else if (OB_UNLIKELY(!tablet_id.is_ls_inner_tablet())) { ret = OB_ERR_UNEXPECTED; LOG_WARN("tablet id is not ls inner tablet", K(ret), K(tablet_id)); } else if (OB_FAIL(has_tablet(ls_id, tablet_id, b_exist))) { LOG_WARN("failed to check tablet existence", K(ret), K(ls_id), K(tablet_id)); } else if (OB_UNLIKELY(b_exist)) { ret = OB_TABLET_EXIST; LOG_WARN("tablet already exists", K(ret), K(ls_id), K(tablet_id)); } else if (OB_FAIL(create_inner_tablet(ls_id, tablet_id, tablet_id/*data_tablet_id*/, create_scn, snapshot_version, table_schema, compat_mode, tablet_handle))) { LOG_WARN("failed to do create tablet", K(ret), K(ls_id), K(tablet_id), K(create_scn), K(major_frozen_scn), K(table_schema), K(compat_mode)); } return ret; } int ObLSTabletService::remove_ls_inner_tablet( const share::ObLSID &ls_id, const common::ObTabletID &tablet_id) { int ret = OB_SUCCESS; common::ObSEArray tablet_id_array; if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else if (OB_UNLIKELY(!ls_id.is_valid()) || OB_UNLIKELY(!tablet_id.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid args", K(ret), K(ls_id), K(tablet_id)); } else if (OB_UNLIKELY(ls_id != ls_->get_ls_id())) { ret = OB_ERR_UNEXPECTED; LOG_WARN("ls id is unexpected", K(ret), "arg_ls_id", ls_id, "ls_id", ls_->get_ls_id()); } else if (OB_FAIL(do_remove_tablet(ObTabletMapKey(ls_id, tablet_id)))) { LOG_WARN("failed to remove tablet", K(ret), K(ls_id), K(tablet_id)); } return ret; } int ObLSTabletService::build_tablet_iter(ObLSTabletIterator &iter, const bool except_ls_inner_tablet) { int ret = common::OB_SUCCESS; GetAllTabletIDOperator op(iter.tablet_ids_, except_ls_inner_tablet); iter.ls_tablet_service_ = this; if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; STORAGE_LOG(WARN, "not inited", K(ret), K_(is_inited)); } else if (OB_FAIL(tablet_id_set_.foreach(op))) { STORAGE_LOG(WARN, "fail to get all tablet ids from set", K(ret)); } else if (OB_UNLIKELY(!iter.is_valid())) { ret = OB_ERR_UNEXPECTED; LOG_WARN("iter is invalid", K(ret), K(iter)); } if (OB_FAIL(ret)) { iter.reset(); } return ret; } int ObLSTabletService::build_tablet_iter(ObHALSTabletIDIterator &iter) { int ret = common::OB_SUCCESS; GetAllTabletIDOperator op(iter.tablet_ids_); if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; STORAGE_LOG(WARN, "not inited", K(ret), K_(is_inited)); } else if (OB_FAIL(tablet_id_set_.foreach(op))) { STORAGE_LOG(WARN, "fail to get all tablet ids from set", K(ret)); } else if (OB_UNLIKELY(!iter.is_valid())) { ret = OB_ERR_UNEXPECTED; LOG_WARN("iter is invalid", K(ret), K(iter)); } if (OB_FAIL(ret)) { iter.reset(); } return ret; } int ObLSTabletService::build_tablet_iter(ObHALSTabletIterator &iter) { int ret = common::OB_SUCCESS; iter.ls_tablet_service_ = this; if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; STORAGE_LOG(WARN, "not inited", K(ret), K_(is_inited)); } else if (OB_FAIL(build_tablet_iter(iter.tablet_id_iter_))) { STORAGE_LOG(WARN, "fail to build ha tablet id iterator", K(ret)); } if (OB_FAIL(ret)) { iter.reset(); } return ret; } int ObLSTabletService::set_allow_to_read_(ObLS *ls) { int ret = OB_SUCCESS; ObMigrationStatus migration_status = ObMigrationStatus::OB_MIGRATION_STATUS_MAX; share::ObLSRestoreStatus restore_status; if (OB_ISNULL(ls)) { ret = OB_INVALID_ARGUMENT; LOG_WARN("set allow to read get invalid argument", K(ret), KP(ls)); } else { if (OB_FAIL(ls->get_migration_and_restore_status(migration_status, restore_status))) { LOG_WARN("failed to get ls migration and restore status", K(ret), KPC(ls)); } else if ((ObMigrationStatus::OB_MIGRATION_STATUS_NONE != migration_status && ObMigrationStatus::OB_MIGRATION_STATUS_HOLD != migration_status) || ObLSRestoreStatus::RESTORE_NONE != restore_status) { allow_to_read_mgr_.disable_to_read(); FLOG_INFO("set ls do not allow to read", KPC(ls), K(migration_status), K(restore_status)); } else { allow_to_read_mgr_.enable_to_read(); } } return ret; } void ObLSTabletService::enable_to_read() { allow_to_read_mgr_.enable_to_read(); } void ObLSTabletService::disable_to_read() { allow_to_read_mgr_.disable_to_read(); } int ObLSTabletService::GetAllTabletIDOperator::operator()(const common::ObTabletID &tablet_id) { int ret = OB_SUCCESS; if (OB_UNLIKELY(!tablet_id.is_valid())) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid arguments", K(ret), K(tablet_id)); } else if (except_ls_inner_tablet_ && tablet_id.is_ls_inner_tablet()) { // do nothing } else if (OB_FAIL(tablet_ids_.push_back(tablet_id))) { LOG_WARN("failed to push back tablet id", K(ret), K(tablet_id)); } return ret; } int ObLSTabletService::DestroyMemtableAndMemberAndMdsTableOperator::operator()(const common::ObTabletID &tablet_id) { int ret = OB_SUCCESS; ObTenantMetaMemMgr *t3m = MTL(ObTenantMetaMemMgr*); cur_tablet_id_ = tablet_id; if (OB_UNLIKELY(!tablet_id.is_valid()) || OB_ISNULL(tablet_svr_)) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid arguments", K(ret), K(tablet_id), K(tablet_svr_)); } else if (OB_ISNULL(tablet_svr_->ls_)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("ls is null", K(ret)); } else { const ObTabletMapKey key(tablet_svr_->ls_->get_ls_id(), tablet_id); if (OB_FAIL(t3m->release_memtable_and_mds_table_for_ls_offline(key))) { LOG_WARN("failed to release memtables and mds table", K(ret), K(key)); } } return ret; } int ObLSTabletService::SetMemtableFrozenOperator::operator()(const common::ObTabletID &tablet_id) { int ret = OB_SUCCESS; ObTabletHandle handle; cur_tablet_id_ = tablet_id; if (OB_UNLIKELY(!tablet_id.is_valid()) || OB_ISNULL(tablet_svr_)) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid arguments", K(ret), K(tablet_id), K(tablet_svr_)); } else if (OB_FAIL(tablet_svr_->get_tablet(tablet_id, handle, ObTabletCommon::DEFAULT_GET_TABLET_NO_WAIT, ObMDSGetTabletMode::READ_WITHOUT_CHECK))) { if (OB_TABLET_NOT_EXIST == ret) { LOG_WARN("failed to get tablet, skip set memtable frozen", K(ret), K(tablet_id)); ret = OB_SUCCESS; } else { LOG_ERROR("failed to get tablet", K(ret), K(tablet_id)); } } else if (OB_FAIL(handle.get_obj()->set_frozen_for_all_memtables())) { LOG_WARN("failed to set frozen for all memtables", K(ret), K(tablet_id)); } return ret; } void ObLSTabletService::AllowToReadMgr::disable_to_read() { AllowToReadInfo read_info; AllowToReadInfo next_read_info; do { LOAD128(read_info, &read_info_); if (!read_info.allow_to_read()) { break; } else { next_read_info.info_.allow_to_read_ = 0; next_read_info.info_.seq_ = read_info.info_.seq_ + 1; } } while (!CAS128(&read_info_, read_info, next_read_info)); } void ObLSTabletService::AllowToReadMgr::enable_to_read() { AllowToReadInfo read_info; AllowToReadInfo next_read_info; do { LOAD128(read_info, &read_info_); if (read_info.allow_to_read()) { break; } else { next_read_info.info_.allow_to_read_ = 1; next_read_info.info_.seq_ = read_info.info_.seq_; } } while (!CAS128(&read_info_, read_info, next_read_info)); } void ObLSTabletService::AllowToReadMgr::load_allow_to_read_info( AllowToReadInfo &read_info) { LOAD128(read_info, &read_info_); } void ObLSTabletService::AllowToReadMgr::check_read_info_same( const AllowToReadInfo &read_info, bool &is_same) { AllowToReadInfo current_read_info; LOAD128(current_read_info, &read_info_); is_same = read_info == current_read_info; } int ObLSTabletService::get_all_tablet_ids( const bool except_ls_inner_tablet, common::ObIArray &tablet_id_array) { int ret = OB_SUCCESS; GetAllTabletIDOperator op(tablet_id_array, except_ls_inner_tablet); if (OB_FAIL(tablet_id_set_.foreach(op))) { LOG_WARN("failed to traverse tablet id set", K(ret)); } return ret; } int ObLSTabletService::flush_mds_table(int64_t recycle_scn) { int ret = OB_SUCCESS; if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("ls tablet service is not init", KR(ret), KPC(this)); } else if (OB_FAIL(mds_table_mgr_.flush(SCN::max_scn(), true))) { LOG_WARN("flush mds table failed", KR(ret), KPC(this)); } LOG_INFO("finish flush mds table", KR(ret), K(recycle_scn)); return ret; } int ObLSTabletService::set_frozen_for_all_memtables() { int ret = OB_SUCCESS; if (IS_NOT_INIT) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else { SetMemtableFrozenOperator set_mem_frozen_op(this); if (OB_FAIL(tablet_id_set_.foreach(set_mem_frozen_op))) { LOG_WARN("fail to set memtables frozen", K(ret), K(set_mem_frozen_op.cur_tablet_id_)); } } return ret; } int ObLSTabletService::ha_scan_all_tablets(const HandleTabletMetaFunc &handle_tablet_meta_f) { int ret = OB_SUCCESS; if (OB_UNLIKELY(!is_inited_)) { ret = OB_NOT_INIT; LOG_WARN("not inited", K(ret), K_(is_inited)); } else { ObHALSTabletIterator iterator(ls_->get_ls_id(), false/* need_initial_state */); if (OB_FAIL(build_tablet_iter(iterator))) { LOG_WARN("fail to build tablet iterator", K(ret), KPC(this)); } else { ObTabletHandle tablet_handle; ObTablet *tablet = nullptr; obrpc::ObCopyTabletInfo tablet_info; ObTabletCreateDeleteMdsUserData user_data; bool committed_flag = false; while (OB_SUCC(ret)) { tablet_info.reset(); user_data.reset(); committed_flag = false; if (OB_FAIL(iterator.get_next_tablet(tablet_handle))) { if (OB_ITER_END == ret) { ret = OB_SUCCESS; break; } else { LOG_WARN("failed to get tablet", K(ret)); } } else if (OB_ISNULL(tablet = tablet_handle.get_obj())) { ret = OB_ERR_UNEXPECTED; LOG_WARN("tablet is nullptr", K(ret), K(tablet_handle)); } else if (OB_FAIL(tablet->ObITabletMdsInterface::get_latest_tablet_status(user_data, committed_flag))) { if (OB_EMPTY_RESULT == ret) { ret = OB_SUCCESS; } else { LOG_WARN("failed to get latest tablet status", K(ret), KPC(tablet)); } } else if (!committed_flag && ObTabletStatus::TRANSFER_IN == user_data.tablet_status_) { //TODO(muwei.ym) CAN NOT USE this condition when MDS supports uncommitted transaction // why we should skip uncommited transfer in tablet, because if we backup the uncommited transfer in tablet // but the final result of the uncommited transfer in tablet is aborted, which means the tablet has no MDS Table, // and the restore process will create this tablet nontheless, however this aborted tablet should be GC-ed at the end, // because the aborted tablet has no MDS Table, the tablet can not be GC-ed correctly, resulting in the tablet dangling // for details, see issue-51990749 // we can skip backup uncommited transfer in tablets because we backup ls meta first // if the start transfer in transaction is not commited, the clog_checkpoint_scn recorded // in ls meta will not be advanced, so that even though we skip backup uncommited // transfer in tablet, we can still restore transfer in tablet by replaying clog LOG_WARN("tablet is transfer in but not commited, skip", K(tablet_handle), K(user_data)); continue; } else if (OB_FAIL(tablet->build_migration_tablet_param(tablet_info.param_))) { LOG_WARN("failed to build migration tablet param", K(ret)); } else if (OB_FAIL(tablet->get_ha_sstable_size(tablet_info.data_size_))) { LOG_WARN("failed to get sstable size", K(ret), KPC(tablet)); } else if (OB_FAIL(ObStorageHAUtils::get_server_version(tablet_info.version_))) { LOG_WARN("failed to get server version", K(ret), K(tablet_info)); } else { tablet_info.tablet_id_ = tablet->get_tablet_meta().tablet_id_; tablet_info.status_ = ObCopyTabletStatus::TABLET_EXIST; if (OB_FAIL(handle_tablet_meta_f(tablet_info))) { LOG_WARN("fail to handle tablet meta", K(ret), K(tablet_info)); } } } } } return ret; } int ObLSTabletService::ha_get_tablet( const common::ObTabletID &tablet_id, ObTabletHandle &handle) { int ret = OB_SUCCESS; bool is_empty_shell = false; ObTablet *tablet = nullptr; if (OB_FAIL(direct_get_tablet(tablet_id, handle))) { LOG_WARN("failed to get tablet", K(ret), K(tablet_id)); } else if (OB_ISNULL(tablet = handle.get_obj())) { ret = OB_ERR_UNEXPECTED; LOG_WARN("tablet should not be NULL", K(ret), K(tablet_id)); } else if (tablet->is_empty_shell()) { // treat empty shell as tablet not exist. ret = OB_TABLET_NOT_EXIST; } return ret; } int ObLSTabletService::check_real_leader_for_4377_(const ObLSID ls_id) { int ret = OB_SUCCESS; ObLSService* ls_srv = nullptr; ObLSHandle ls_handle; ObLS *ls = nullptr; int64_t epoch = 0; bool is_real_leader = false; if (OB_ISNULL(ls_srv = MTL(ObLSService*))) { ret = OB_ERR_UNEXPECTED; LOG_ERROR("MTL(ObLSService*) fail, MTL not init?", K(ret)); } else if (OB_FAIL(ls_srv->get_ls(ls_id, ls_handle, ObLSGetMod::TRANS_MOD))) { LOG_ERROR("ls_srv->get_ls() fail", KR(ret)); } else if (OB_ISNULL(ls = ls_handle.get_ls())) { ret = OB_ERR_UNEXPECTED; LOG_ERROR("invalid ls", KR(ret)); } else if (OB_FAIL(ls->get_tx_svr()->get_tx_ls_log_adapter()->get_role(is_real_leader, epoch))) { LOG_WARN("get replica status fail", K(ret), KPC(ls)); } else if (!is_real_leader) { ret = OB_NOT_MASTER; LOG_WARN("get follower status during 4377", K(ret), KPC(ls)); } return ret; } int ObLSTabletService::check_need_rollback_in_transfer_for_4377_(const transaction::ObTxDesc *tx_desc, ObTabletHandle &data_tablet_handle) { int ret = OB_SUCCESS; ObTabletCreateDeleteMdsUserData user_data; bool unused_committed_flag = false; if (OB_ISNULL(tx_desc)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("tx_desc is null when check 4377", K(ret)); } else if (OB_FAIL(data_tablet_handle.get_obj()->ObITabletMdsInterface::get_latest_tablet_status( user_data, unused_committed_flag))) { LOG_WARN("can not get the tablet status from ObITabletMdsInterface", K(ret)); } else { // ObTabletStatus tablet_status = user_data.tablet_status_; // CASE 1: tablet_status_ == NORMAL, means there's no transfer in progress right now. // If there's valid transfer_scn_, which means transfer has finished, we should check // whether the transaction started before transfer to avoid throwing incorrect 4377 // error. Otherwise, it's a normal case of 4377 check because no transfer has happened, // and we should still throw 4377 error. // // CASE 2: tablet_status_ == TRANSFER_OUT, means it's in transfer out progress. // CASE 2.1: transfer_scn_ is invalid, the transfer_scn_ is not backfilled, we still // read from origin tablet, if there's inconsistent, it should throw 4377 error // CASE 2.2: transfer_scn_ is valid, the transfer_scn_ is backfilled, it means that // tablet has started to transfer out. If it's the first transfer, we should // throw 4377 error, otherwise we should compare the transfer_scn_ with the tx_scn, // and decide to rollback the transaction or throw 4377 error. // However, we can not be sure about whether this transfer out is the first transfer or not. // So we consider all the transfer out status as not the first transfer here, to avoid // throwing the incorrect 4377 error. // // CASE 3: tablet_status_ == TRANSFER_IN, means it's in transfer in progress, and // the transfer out progress must have been finished. We can compare the transfer_scn_ // with the tx_scn directly because there should be valid transfer_scn_. // // Above all, we do not need to consider the status of tablet. if (user_data.transfer_scn_.is_valid()) { if (user_data.transfer_scn_.convert_to_ts() > tx_desc->get_active_ts()) { // TODO(yangyifei.yyf): active_ts is set by ObClockGenerator::get_clock, it's not a GTS. // And transfer_scn is set by redo_scn, it's incorrect to compare it with active_ts. // We should adjust this judgment later. ret = OB_TRANS_NEED_ROLLBACK; LOG_WARN("maybe meet transfer during kill tx, which can cause 4377 error, so we will rollback it", K(tx_desc), K(user_data)); } } else { // There's no transfer after trans begin, still throw 4377 error } } return ret; } int ObLSTabletService::check_parts_tx_state_in_transfer_for_4377_(transaction::ObTxDesc *tx_desc) { int ret = OB_SUCCESS; transaction::ObTransService *txs = MTL(transaction::ObTransService *); transaction::ObTxPartList copy_parts; bool is_alive = false; if (OB_ISNULL(tx_desc)) { ret = OB_ERR_UNEXPECTED; LOG_ERROR("tx_desc is null", K(ret)); } else if (OB_FAIL(tx_desc->get_parts_copy(copy_parts))) { TRANS_LOG(WARN, "get participants copy error", K(ret)); } else { // Although we can verify whether transaction data is incomplete due to the // transfer by checking the local tablet. While in the scenario where we // validate the index table through the main table, we cannot discover // whether the main table's txn data is incomplete due to the transfer by // using the local index table. Furthermore, the local index table and the // main table may not even locate on the same machine. // // Therefore, we choose to traverse all participant lists through RPC to // confirm whether the txn context that could potentially participate in the // transfer and has been terminated due to the transfer. In this scenario, // we consider the occurrence of 4377 as misreporting, and we convert it // into OB_TRANS_NEED_ROLLBACK to indicate the need to rollback the txn. for (int64_t i = 0; OB_SUCC(ret) && i < copy_parts.count(); i++) { ObLSID ls_id = copy_parts[i].id_; is_alive = false; if (OB_FAIL(txs->ask_tx_state_for_4377(ls_id, tx_desc->get_tx_id(), is_alive))) { TRANS_LOG(WARN, "fail to ask tx state for 4377", K(tx_desc)); } else if (!is_alive) { ret = OB_TRANS_NEED_ROLLBACK; LOG_WARN("maybe meet transfer during kill tx, which can cause 4377 error, so we will rollback it", K(tx_desc)); } } } return ret; } int ObLSTabletService::offline_build_tablet_without_memtable_() { int ret = OB_SUCCESS; ObArray tablet_id_array; const bool except_ls_inner_tablet = false; const SCN scn(SCN::max_scn()); if (OB_FAIL(get_all_tablet_ids(except_ls_inner_tablet, tablet_id_array))) { LOG_WARN("failed to get all tablet ids", K(ret)); } else { for (int64_t i = 0; OB_SUCC(ret) && i < tablet_id_array.count(); ++i) { const ObTabletID &tablet_id = tablet_id_array.at(i); if (OB_FAIL(update_tablet_release_memtable_for_offline(tablet_id, scn))) { LOG_WARN("failed to update tablet release memtable", K(ret), K(tablet_id)); } } } return ret; } int ObLSTabletService::offline_destroy_memtable_and_mds_table_() { int ret = OB_SUCCESS; DestroyMemtableAndMemberAndMdsTableOperator clean_mem_op(this); if (OB_FAIL(tablet_id_set_.foreach(clean_mem_op))) { LOG_WARN("fail to clean memtables", K(ret), "cur_tablet_id", clean_mem_op.cur_tablet_id_); } return ret; } } // namespace storage } // namespace oceanbase