/** * Copyright (c) 2021 OceanBase * OceanBase CE is licensed under Mulan PubL v2. * You can use this software according to the terms and conditions of the Mulan PubL v2. * You may obtain a copy of Mulan PubL v2 at: * http://license.coscl.org.cn/MulanPubL-2.0 * THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, * EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, * MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. * See the Mulan PubL v2 for more details. */ #include #include #include #include "share/scn.h" #define private public #include "env/ob_simple_log_cluster_env.h" #undef private const std::string TEST_NAME = "test_rebuild"; using namespace oceanbase::common; using namespace oceanbase; namespace oceanbase { using namespace logservice; using namespace palf; namespace unittest { class TestObSimpleLogClusterRebuild : public ObSimpleLogClusterTestEnv { public: TestObSimpleLogClusterRebuild() : ObSimpleLogClusterTestEnv() {} public: class TestRebuildCbImpl : public PalfRebuildCb, public share::ObThreadPool { public: TestRebuildCbImpl(): test_base_(NULL), server_idx_(-1), rebuild_palf_id_(-1), rebuild_lsn_(), allow_rebuild_(false), is_inited_(false) {} virtual ~TestRebuildCbImpl() { destroy(); } public: int init(TestObSimpleLogClusterRebuild *ptr, const int64_t server_idx) { int ret = OB_SUCCESS; if (OB_ISNULL(ptr) || server_idx < 0 || server_idx >= ptr->get_member_cnt()) { ret = OB_INVALID_ARGUMENT; PALF_LOG(ERROR, "invalid_argument", KP(ptr), K(server_idx)); } else { test_base_ = ptr; server_idx_ = server_idx; is_inited_ = true; } return ret; } int start() { int ret = OB_SUCCESS; if (IS_NOT_INIT) { ret = OB_NOT_INIT; } else if (OB_FAIL(share::ObThreadPool::start())) { PALF_LOG(ERROR, "RebuildCB thread failed to start"); } else { PALF_LOG(INFO, "RebuildCB start success", K(ret)); } return ret; } void destroy() { is_inited_ = false; stop(); wait(); server_idx_ = -1; rebuild_palf_id_ = -1; rebuild_lsn_.reset(); allow_rebuild_ = false; test_base_ = NULL; } int on_rebuild(const int64_t id, const LSN &lsn) { int ret = OB_SUCCESS; if (!is_inited_) { ret = OB_NOT_INIT; } else if (id < 0 || !lsn.is_valid()) { ret = OB_INVALID_ARGUMENT; SERVER_LOG(ERROR, "invalid rebuild argument", K(server_idx_), K(id), K(lsn)); } else { rebuild_palf_id_ = id; rebuild_lsn_ = lsn; SERVER_LOG(INFO, "on_rebuild success", K(server_idx_), K(id), K(lsn)); } return ret; } void run1() { share::ObTenantBase tenant_base(OB_SYS_TENANT_ID); tenant_base.init(); ObTenantEnv::set_tenant(&tenant_base); lib::set_thread_name("RebuildCB"); while (!has_set_stop()) { if (true == allow_rebuild_ && rebuild_palf_id_ != -1 && rebuild_lsn_.is_valid()) { PalfHandleImplGuard leader; PalfHandleImplGuard *rebuild_palf; int64_t leader_idx; PalfBaseInfo rebuild_base_info; std::vector palf_list; EXPECT_EQ(OB_SUCCESS, test_base_->get_cluster_palf_handle_guard(rebuild_palf_id_, palf_list)); rebuild_palf = palf_list[server_idx_]; EXPECT_EQ(OB_SUCCESS, test_base_->get_leader(test_base_->palf_id_, leader, leader_idx)); EXPECT_EQ(OB_SUCCESS, rebuild_palf->palf_handle_impl_->disable_sync()); EXPECT_EQ(OB_SUCCESS, leader.palf_handle_impl_->get_base_info(rebuild_lsn_, rebuild_base_info)); EXPECT_EQ(OB_SUCCESS, rebuild_palf->palf_handle_impl_->advance_base_info(rebuild_base_info, true)); EXPECT_EQ(OB_SUCCESS, rebuild_palf->palf_handle_impl_->enable_sync()); rebuild_palf = NULL; test_base_->revert_cluster_palf_handle_guard(palf_list); rebuild_palf_id_ = -1; rebuild_lsn_.reset(); } SERVER_LOG(INFO, "RebuildCB", K(server_idx_)); usleep(500 * 1000); } } public: TestObSimpleLogClusterRebuild *test_base_; int64_t server_idx_; int64_t rebuild_palf_id_; LSN rebuild_lsn_; bool allow_rebuild_; bool is_inited_; }; }; int64_t ObSimpleLogClusterTestBase::member_cnt_ = 3; int64_t ObSimpleLogClusterTestBase::node_cnt_ = 3; std::string ObSimpleLogClusterTestBase::test_name_ = TEST_NAME; bool ObSimpleLogClusterTestBase::need_add_arb_server_ = false; TEST_F(TestObSimpleLogClusterRebuild, test_old_leader_rebuild) { SET_CASE_LOG_FILE(TEST_NAME, "old_leader_rebuild"); const int64_t id = ATOMIC_AAF(&palf_id_, 1); constexpr int64_t KB = 1024; constexpr int64_t MB = 1024 * 1024; PALF_LOG(INFO, "start test old_leader_rebuild", K(id)); int64_t leader_idx = 0; unittest::PalfHandleImplGuard leader; unittest::PalfHandleImplGuard *rebuild_server = NULL; std::vector palf_list; int64_t follower_idx1, follower_idx2; EXPECT_EQ(OB_SUCCESS, create_paxos_group(id, leader_idx, leader)); EXPECT_EQ(OB_SUCCESS, get_cluster_palf_handle_guard(id, palf_list)); follower_idx1 = (leader_idx + 1) % 3; follower_idx2 = (leader_idx + 2) % 3; TestRebuildCbImpl rebuild_cb; PalfRebuildCbNode rebuild_node(&rebuild_cb); EXPECT_EQ(OB_SUCCESS, rebuild_cb.init(this, leader_idx)); EXPECT_EQ(OB_SUCCESS, rebuild_cb.start()); // reigster rebuild cb rebuild_server = &leader; EXPECT_EQ(OB_SUCCESS, rebuild_server->palf_handle_impl_->register_rebuild_cb(&rebuild_node)); EXPECT_EQ(OB_SUCCESS, submit_log(leader, 1000, id, 6 * KB)); sleep(1); PALF_LOG(INFO, "begin block net", K(id), K(leader_idx), K(follower_idx1), K(follower_idx2)); block_net(leader_idx, follower_idx1); block_net(leader_idx, follower_idx2); submit_log(leader, 100, id, 6 * KB); PALF_LOG(INFO, "begin submit logs", K(id), K(leader_idx), K(follower_idx1), K(follower_idx2)); (void) submit_log(leader, 1000, leader_idx, MB); PALF_LOG(INFO, "after sleep 16s, begin get_leader", K(id), K(leader_idx), K(follower_idx1), K(follower_idx2)); int64_t new_leader_idx = 0; unittest::PalfHandleImplGuard new_leader; EXPECT_EQ(OB_SUCCESS, get_leader(id, new_leader, new_leader_idx)); PALF_LOG(INFO, "after get_leader", K(id), K(leader_idx), K(new_leader_idx)); // submit logs EXPECT_EQ(OB_SUCCESS, submit_log(new_leader, 64 * 6, id, MB)); // update new_leader's disk option, only reserves 4 * 80% log blocks, // that means 2 blocks will be recycled PALF_LOG(INFO, "begin advance_base_lsn", K(id), K(leader_idx), K(new_leader_idx)); LSN recycle_lsn(2 * PALF_BLOCK_SIZE); EXPECT_EQ(OB_SUCCESS, new_leader.palf_handle_impl_->set_base_lsn(recycle_lsn)); update_disk_options(new_leader_idx, 4); // recycle 2 block sleep(5); block_id_t leader_min_block_id; share::SCN min_scn; block_id_t min_block_id, max_block_id; while (true) { EXPECT_EQ(OB_SUCCESS, new_leader.palf_handle_impl_->get_min_block_info_for_gc(leader_min_block_id, min_scn)); // palf will reserve one more block if (1 ==leader_min_block_id) { break; } else { sleep(2); } } EXPECT_EQ(OB_SUCCESS, rebuild_server->palf_handle_impl_->log_engine_.get_block_id_range(min_block_id, max_block_id)); PALF_LOG_RET(ERROR, OB_ERR_UNEXPECTED, "runlin trace get_block_id_range", K(min_block_id), K(max_block_id)); // submit a cond task before unblocking net to stop truncating task IOTaskCond cond(id, rebuild_server->palf_env_impl_->last_palf_epoch_); LogIOWorker *io_worker = &rebuild_server->palf_env_impl_->log_io_worker_; io_worker->submit_io_task(&cond); // after unblocking net, old leader will do rebuild unblock_net(leader_idx, follower_idx1); unblock_net(leader_idx, follower_idx2); sleep(5); // is truncating, can not rebuild if (rebuild_server->palf_handle_impl_->sw_.is_truncating_) { PalfBaseInfo rebuild_base_info; EXPECT_EQ(OB_SUCCESS, new_leader.palf_handle_impl_->get_base_info(rebuild_cb.rebuild_lsn_, rebuild_base_info)); EXPECT_EQ(OB_SUCCESS, rebuild_server->palf_handle_impl_->disable_sync()); EXPECT_EQ(OB_EAGAIN, rebuild_server->palf_handle_impl_->advance_base_info(rebuild_base_info, true)); } cond.cond_.signal(); sleep(5); rebuild_cb.allow_rebuild_ = true; PalfBaseInfo base_info_in_leader; PalfBaseInfo base_info_after_rebuild; // check block_id block_id_t rebuild_server_min_block_id; // get block_id may be executed when all blocks are deleted, so wait for OB_SUCCESS while (OB_SUCCESS != rebuild_server->palf_handle_impl_->get_min_block_info_for_gc(rebuild_server_min_block_id, min_scn)) { sleep(1); } EXPECT_EQ(2, rebuild_server_min_block_id); // check base_lsn EXPECT_EQ(recycle_lsn, rebuild_server->palf_handle_impl_->log_engine_.get_log_meta().get_log_snapshot_meta().base_lsn_); EXPECT_EQ(OB_SUCCESS, new_leader.palf_handle_impl_->get_base_info(recycle_lsn, base_info_in_leader)); EXPECT_EQ(OB_SUCCESS, rebuild_server->palf_handle_impl_->get_base_info(recycle_lsn, base_info_after_rebuild)); // check prev_log_info EXPECT_EQ(base_info_in_leader.prev_log_info_, base_info_after_rebuild.prev_log_info_); LSN leader_end_lsn, rebuild_server_end_lsn; leader_end_lsn = new_leader.palf_handle_impl_->get_end_lsn(); rebuild_server_end_lsn = rebuild_server->palf_handle_impl_->get_end_lsn(); PALF_LOG(INFO, "rebuild result", K(leader_end_lsn), K(rebuild_server_end_lsn)); // EXPECT_EQ(OB_SUCCESS, delete_paxos_group(id)); revert_cluster_palf_handle_guard(palf_list); EXPECT_EQ(OB_SUCCESS, new_leader.palf_handle_impl_->set_base_lsn(LSN(64*6*MB))); sleep(1); EXPECT_EQ(OB_SUCCESS, update_disk_options(new_leader_idx, 40)); PALF_LOG(INFO, "end test old_leader_rebuild", K(id)); } TEST_F(TestObSimpleLogClusterRebuild, test_follower_rebuild) { SET_CASE_LOG_FILE(TEST_NAME, "follower_rebuild"); const int64_t id = ATOMIC_AAF(&palf_id_, 1); constexpr int64_t MB = 1024 * 1024; PALF_LOG(INFO, "start test follower_rebuild", K(id)); int64_t leader_idx = 0; unittest::PalfHandleImplGuard leader; unittest::PalfHandleImplGuard *rebuild_server = NULL; std::vector palf_list; int64_t follower_idx; EXPECT_EQ(OB_SUCCESS, create_paxos_group(id, leader_idx, leader)); EXPECT_EQ(OB_SUCCESS, get_cluster_palf_handle_guard(id, palf_list)); follower_idx = (leader_idx + 1) % 3; TestRebuildCbImpl rebuild_cb; rebuild_cb.allow_rebuild_ = true; PalfRebuildCbNode rebuild_node(&rebuild_cb); EXPECT_EQ(OB_SUCCESS, rebuild_cb.init(this, follower_idx)); EXPECT_EQ(OB_SUCCESS, rebuild_cb.start()); // reigster rebuild cb rebuild_server = palf_list[follower_idx]; EXPECT_EQ(OB_SUCCESS, rebuild_server->palf_handle_impl_->register_rebuild_cb(&rebuild_node)); // the follower is empty block_net(leader_idx, follower_idx); EXPECT_EQ(OB_SUCCESS, submit_log(leader, 64, leader_idx, MB)); EXPECT_EQ(OB_SUCCESS, submit_log(leader, 64 * 5, leader_idx, MB)); // recycle one block LSN recycle_lsn(2 * PALF_BLOCK_SIZE); EXPECT_EQ(OB_SUCCESS, leader.palf_handle_impl_->set_base_lsn(recycle_lsn)); update_disk_options(leader_idx, 4); sleep(1); block_id_t leader_min_block_id, follower_min_block_id; share::SCN min_scn; while (true) { EXPECT_EQ(OB_SUCCESS, leader.palf_handle_impl_->get_min_block_info_for_gc(leader_min_block_id, min_scn)); if (1 == leader_min_block_id) { break; } else { sleep(2); } } EXPECT_EQ(recycle_lsn, leader.palf_handle_impl_->log_engine_.get_log_meta().get_log_snapshot_meta().base_lsn_); // follower_idx will trigger rebuild when fetching log unblock_net(leader_idx, follower_idx); sleep(10); PalfBaseInfo base_info_in_leader; PalfBaseInfo base_info_after_rebuild; // check block_id EXPECT_EQ(OB_SUCCESS, rebuild_server->palf_handle_impl_->get_min_block_info_for_gc(follower_min_block_id, min_scn)); EXPECT_EQ(2, follower_min_block_id); // check base_lsn EXPECT_EQ(recycle_lsn, rebuild_server->palf_handle_impl_->log_engine_.get_log_meta().get_log_snapshot_meta().base_lsn_); EXPECT_EQ(OB_SUCCESS, leader.palf_handle_impl_->get_base_info(recycle_lsn, base_info_in_leader)); EXPECT_EQ(OB_SUCCESS, rebuild_server->palf_handle_impl_->get_base_info(recycle_lsn, base_info_after_rebuild)); // check prev_log_info EXPECT_EQ(base_info_in_leader.prev_log_info_, base_info_after_rebuild.prev_log_info_); LSN leader_end_lsn, rebuild_server_end_lsn; leader_end_lsn = leader.palf_handle_impl_->get_end_lsn(); rebuild_server_end_lsn = rebuild_server->palf_handle_impl_->get_end_lsn(); PALF_LOG(INFO, "rebuild result", K(leader_end_lsn), K(rebuild_server_end_lsn)); // EXPECT_EQ(OB_SUCCESS, delete_paxos_group(id)); revert_cluster_palf_handle_guard(palf_list); PALF_LOG(INFO, "end test follower_rebuild", K(id)); } } // end unittest } // end oceanbase int main(int argc, char **argv) { RUN_SIMPLE_LOG_CLUSTER_TEST(TEST_NAME); }