Files
oceanbase/tools/obcdc/src/ob_log_formatter.cpp
2022-03-25 18:10:38 +08:00

1510 lines
58 KiB
C++

/**
* Copyright (c) 2021 OceanBase
* OceanBase CE is licensed under Mulan PubL v2.
* You can use this software according to the terms and conditions of the Mulan PubL v2.
* You may obtain a copy of Mulan PubL v2 at:
* http://license.coscl.org.cn/MulanPubL-2.0
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
* See the Mulan PubL v2 for more details.
*/
#define USING_LOG_PREFIX OBLOG_FORMATTER
#include "ob_log_formatter.h"
#include <BinLogBuf.h> // BinLogBuf
#include "share/schema/ob_table_schema.h" // TableSchemaType
#include "lib/string/ob_string.h" // ObString
#include "storage/transaction/ob_trans_define.h" // ObTransID
#include "ob_log_meta_manager.h" // IObLogMetaManager
#include "ob_log_utils.h" // obj2str
#include "ob_log_schema_getter.h" // IObLogSchemaGetter, DBSchemaInfo
#include "ob_log_instance.h" // IObLogErrHandler, TCTX
#include "ob_obj2str_helper.h" // ObObj2strHelper
#include "ob_log_trans_ctx_mgr.h" // IObLogTransCtxMgr
#include "ob_log_binlog_record_pool.h" // IObLogBRPool
#include "ob_log_storager.h" // IObLogStorager
#include "ob_log_tenant.h" // ObLogTenantGuard, ObLogTenant
#include "ob_log_config.h" // TCONF
using namespace oceanbase::common;
using namespace oceanbase::storage;
using namespace oceanbase::share::schema;
using namespace oceanbase::transaction;
namespace oceanbase
{
namespace liboblog
{
void ObLogFormatter::RowValue::reset()
{
column_num_ = 0;
contain_old_column_ = false;
new_column_array_ = NULL;
old_column_array_ = NULL;
(void)memset(new_columns_, 0, sizeof(new_columns_));
(void)memset(old_columns_, 0, sizeof(old_columns_));
(void)memset(orig_default_value_, 0, sizeof(orig_default_value_));
(void)memset(is_rowkey_, 0, sizeof(is_rowkey_));
(void)memset(is_changed_, 0, sizeof(is_changed_));
}
int ObLogFormatter::RowValue::init(const int64_t column_num, const bool contain_old_column)
{
column_num_ = column_num;
contain_old_column_ = contain_old_column;
new_column_array_ = NULL;
old_column_array_ = NULL;
if (column_num > 0) {
(void)memset(new_columns_, 0, column_num * sizeof(new_columns_[0]));
(void)memset(old_columns_, 0, column_num * sizeof(old_columns_[0]));
(void)memset(orig_default_value_, 0, column_num * sizeof(orig_default_value_[0]));
(void)memset(is_rowkey_, 0, column_num * sizeof(is_rowkey_[0]));
(void)memset(is_changed_, 0, column_num * sizeof(is_changed_[0]));
}
return OB_SUCCESS;
}
ObLogFormatter::ObLogFormatter() : inited_(false),
working_mode_(WorkingMode::UNKNOWN_MODE),
obj2str_helper_(NULL),
br_pool_(NULL),
err_handler_(NULL),
meta_manager_(NULL),
schema_getter_(NULL),
storager_(NULL),
row_value_array_(NULL),
allocator_(ObModIds::OB_LOG_FORMATTER, PAGE_SIZE),
round_value_(0),
skip_dirty_data_(false),
enable_hbase_mode_(false),
hbase_util_(NULL),
skip_hbase_mode_put_column_count_not_consistency_(false),
enable_output_hidden_primary_key_(false),
log_entry_task_count_(0)
{
}
ObLogFormatter::~ObLogFormatter()
{
destroy();
}
int ObLogFormatter::init(const int64_t thread_num,
const int64_t queue_size,
const WorkingMode working_mode,
ObObj2strHelper *obj2str_helper,
IObLogBRPool *br_pool,
IObLogMetaManager *meta_manager,
IObLogSchemaGetter *schema_getter,
IObLogStorager *storager,
IObLogErrHandler *err_handler,
const bool skip_dirty_data,
const bool enable_hbase_mode,
ObLogHbaseUtil &hbase_util,
const bool skip_hbase_mode_put_column_count_not_consistency,
const bool enable_output_hidden_primary_key)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(inited_)) {
LOG_ERROR("ObLogFormatter has been initialized");
ret = OB_INIT_TWICE;
} else if (OB_UNLIKELY(thread_num <= 0)
|| OB_UNLIKELY(queue_size <= 0)
|| OB_UNLIKELY(! is_working_mode_valid(working_mode))
|| OB_ISNULL(obj2str_helper)
|| OB_ISNULL(br_pool)
|| OB_ISNULL(meta_manager)
|| OB_ISNULL(schema_getter)
|| OB_ISNULL(storager)
|| OB_ISNULL(err_handler)) {
LOG_ERROR("invalid arguments", K(thread_num), K(queue_size), K(working_mode), K(obj2str_helper),
K(meta_manager), K(schema_getter), K(storager), K(err_handler));
ret = OB_INVALID_ARGUMENT;
} else if (OB_FAIL(FormatterThread::init(thread_num, queue_size))) {
LOG_ERROR("init formatter queue thread fail", KR(ret), K(thread_num), K(queue_size));
} else if (OB_FAIL(init_row_value_array_(thread_num))) {
LOG_ERROR("init_row_value_array_ fail", KR(ret), K(thread_num));
} else {
working_mode_ = working_mode;
obj2str_helper_ = obj2str_helper;
br_pool_ = br_pool;
err_handler_ = err_handler;
meta_manager_ = meta_manager;
schema_getter_ = schema_getter;
storager_ = storager;
round_value_ = 0;
skip_dirty_data_ = skip_dirty_data;
enable_hbase_mode_ = enable_hbase_mode;
hbase_util_ = &hbase_util;
skip_hbase_mode_put_column_count_not_consistency_ = skip_hbase_mode_put_column_count_not_consistency;
enable_output_hidden_primary_key_ = enable_output_hidden_primary_key;
log_entry_task_count_ = 0;
inited_ = true;
LOG_INFO("Formatter init succ", K(working_mode_), "working_mode", print_working_mode(working_mode_),
K(thread_num), K(queue_size));
}
return ret;
}
void ObLogFormatter::destroy()
{
FormatterThread::destroy();
inited_ = false;
destroy_row_value_array_();
working_mode_ = WorkingMode::UNKNOWN_MODE;
obj2str_helper_ = NULL;
br_pool_ = NULL;
row_value_array_ = NULL;
err_handler_ = NULL;
meta_manager_ = NULL;
schema_getter_ = NULL;
storager_ = NULL;
round_value_ = 0;
skip_dirty_data_ = false;
enable_hbase_mode_ = false;
hbase_util_ = NULL;
skip_hbase_mode_put_column_count_not_consistency_ = false;
enable_output_hidden_primary_key_ = false;
log_entry_task_count_ = 0;
}
int ObLogFormatter::start()
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(! inited_)) {
LOG_ERROR("ObLogFormatter has not been initialized");
ret = OB_NOT_INIT;
} else if (OB_FAIL(FormatterThread::start())) {
LOG_ERROR("start formatter thread fail", KR(ret), "thread_num", get_thread_num());
} else {
LOG_INFO("start formatter threads succ", "thread_num", get_thread_num());
}
return ret;
}
void ObLogFormatter::stop()
{
if (inited_) {
FormatterThread::stop();
LOG_INFO("stop formatter threads succ", "thread_num", get_thread_num());
}
}
int ObLogFormatter::push(IStmtTask *stmt_task, volatile bool &stop_flag)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(! inited_)) {
LOG_ERROR("ObLogFormatter has not been initialized");
ret = OB_NOT_INIT;
} else if (OB_ISNULL(stmt_task)) {
LOG_ERROR("invalid arguments", K(stmt_task));
ret = OB_INVALID_ARGUMENT;
} else {
// Ensure that all stmt of ObLogEntryTask are pushed to the same queue
const uint64_t hash_value = ATOMIC_FAA(&round_value_, 1);
int64_t stmt_count = 0;
while (OB_SUCC(ret) && NULL != stmt_task) {
IStmtTask *next = stmt_task->get_next();
void *push_task = static_cast<void *>(stmt_task);
RETRY_FUNC(stop_flag, *(static_cast<ObMQThread *>(this)), push, push_task, hash_value, DATA_OP_TIMEOUT);
if (OB_SUCC(ret)) {
stmt_task = next;
++stmt_count;
} else {
if (OB_IN_STOP_STATE != ret) {
LOG_ERROR("push task into formatter fail", KR(ret), K(push_task), K(hash_value));
}
}
} // while
if (OB_SUCC(ret)) {
ATOMIC_INC(&log_entry_task_count_);
}
}
return ret;
}
int ObLogFormatter::get_task_count(int64_t &br_count,
int64_t &log_entry_task_count)
{
int ret = OB_SUCCESS;
br_count = 0;
log_entry_task_count = 0;
if (OB_UNLIKELY(! inited_)) {
LOG_ERROR("parser has not been initialized");
ret = OB_NOT_INIT;
} else if (OB_FAIL(get_total_task_num(br_count))) {
LOG_ERROR("get_total_task_num fail", KR(ret), K(br_count));
} else {
log_entry_task_count = ATOMIC_LOAD(&log_entry_task_count_);
}
return ret;
}
int ObLogFormatter::handle(void *data, const int64_t thread_index, volatile bool &stop_flag)
{
int ret = OB_SUCCESS;
ObLogBR *br = NULL;
ObLogSchemaGuard schema_guard;
DBSchemaInfo db_schema_info;
const TableSchemaType *table_schema = NULL;
IStmtTask *stmt_task = static_cast<IStmtTask *>(data);
DmlStmtTask *dml_stmt_task = dynamic_cast<DmlStmtTask *>(stmt_task);
RowValue *rv = row_value_array_ + thread_index;
int64_t new_column_cnt = 0;
bool is_ignore = false;
// Get the tenant schema: MYSQL or ORACLE
// To ensure the correctness of ObObj2strHelper::obj2str, you need to set the mysql or Oracle schema locally in the thread, there are two scenarios that depend on it:
// 1. set_meta_info_: first build local schema cache, depends on ObObj2strHelper
// 2. build_row_value_: formatting row data, relies on ObObj2strHelper
share::ObWorker::CompatMode compat_mode = share::ObWorker::CompatMode::INVALID;
const bool enable_formatter_print_log = (TCONF.enable_formatter_print_log != 0);
if (OB_UNLIKELY(! inited_)) {
LOG_ERROR("ObLogFormatter has not been initialized");
ret = OB_NOT_INIT;
} else if (OB_ISNULL(stmt_task)) {
LOG_ERROR("invalid arguments", K(stmt_task));
ret = OB_INVALID_ARGUMENT;
} else if (OB_UNLIKELY(! stmt_task->is_dml_stmt()) || OB_ISNULL(dml_stmt_task)) {
LOG_ERROR("stmt_task is not DML statement", "stmt_task", *stmt_task);
ret = OB_NOT_SUPPORTED;
} else if (OB_FAIL(init_binlog_record_for_dml_stmt_task_(dml_stmt_task, br, is_ignore))) {
LOG_ERROR("init_binlog_record_for_dml_stmt_task_ fail", KR(ret), K(dml_stmt_task), K(is_ignore));
} else if (is_ignore) {
br->set_is_valid(false);
}
// Collectively get Simple Schema
// Retry until exit or success
else if (OB_FAIL(get_schema_(
schema_getter_,
dml_stmt_task->get_table_version(),
dml_stmt_task->get_table_id(),
stop_flag,
schema_guard,
table_schema,
db_schema_info))) {
// Ignore the statement if the tenant was deleted, or the table was deleted or the get schema failed
if (OB_TENANT_HAS_BEEN_DROPPED == ret) {
LOG_INFO("[IGNORE_DATA] get schema error, tenant may be dropped",
"tenant_id", dml_stmt_task->get_tenant_id(),
"table_id", dml_stmt_task->get_table_id(),
"dml_stmt_task", *dml_stmt_task);
br->set_is_valid(false);
// reset ret
ret = OB_SUCCESS;
} else if (OB_IN_STOP_STATE != ret) {
LOG_ERROR("get_schema_ fail", KR(ret), KPC(dml_stmt_task), K(table_schema));
}
}
// Failed to get table schema, table was deleted
// TODO: After the table is deleted, do some aftercare
else if (OB_ISNULL(table_schema)) {
if (enable_formatter_print_log) {
LOG_INFO("[IGNORE_DATA] get schema error, table may be dropped",
"table_id", dml_stmt_task->get_table_id(),
"dml_stmt_task", *dml_stmt_task);
} else if (REACH_TIME_INTERVAL(PRINT_LOG_INTERVAL)) {
LOG_INFO("[IGNORE_DATA] get schema error, table may be dropped",
"table_id", dml_stmt_task->get_table_id(),
"dml_stmt_task", *dml_stmt_task);
}
br->set_is_valid(false);
}
// Filter sys tables that are not user tables and are not in backup mode
else if (! table_schema->is_user_table()
&& ! BackupTableHelper::is_sys_table_exist_on_backup_mode(table_schema->is_sys_table(),
table_schema->get_table_id())) {
LOG_DEBUG("[IGNORE_DATA] ignore non-user table or sys table not exist on backup mode",
"table_name", table_schema->get_table_name(),
"table_id", table_schema->get_table_id(),
"table_type", ob_table_type_str(table_schema->get_table_type()));
br->set_is_valid(false);
}
// Ignore data from tables in the recycle bin
else if (table_schema->is_in_recyclebin() && ! is_backup_mode()) {
if (enable_formatter_print_log) {
LOG_INFO("[IGNORE_DATA] table is in recyclebin",
"table_id", dml_stmt_task->get_table_id(),
"is_backup_mode", is_backup_mode(),
KPC(dml_stmt_task));
} else if (REACH_TIME_INTERVAL(PRINT_LOG_INTERVAL)) {
LOG_INFO("[IGNORE_DATA] table is in recyclebin",
"table_id", dml_stmt_task->get_table_id(),
"is_backup_mode", is_backup_mode(),
KPC(dml_stmt_task));
}
br->set_is_valid(false);
} else if (OB_FAIL(get_tenant_compat_mode(table_schema->get_tenant_id(), compat_mode, stop_flag))) {
LOG_ERROR("get_tenant_compat_mode fail", KR(ret), "tenant_id", table_schema->get_tenant_id(),
"compat_mode", print_compat_mode(compat_mode), KPC(table_schema));
} else {
share::CompatModeGuard g(compat_mode);
if (OB_FAIL(set_meta_info_(schema_guard, table_schema, db_schema_info, br, stop_flag))) {
// Failed to get schema, ignore the data
if (OB_TENANT_HAS_BEEN_DROPPED == ret) {
LOG_INFO("[IGNORE_DATA] schema error when set_meta_info, tenant may be dropped", KR(ret),
"table_id", dml_stmt_task->get_table_id(), KPC(dml_stmt_task), K(db_schema_info));
br->set_is_valid(false);
ret = OB_SUCCESS;
} else if (OB_IN_STOP_STATE != ret) {
LOG_ERROR("set_meta_info_ fail", KR(ret), K(table_schema), K(db_schema_info), K(br),
"compat_mode", print_compat_mode(compat_mode));
}
} else if (OB_FAIL(build_row_value_(rv, dml_stmt_task, table_schema, new_column_cnt))) {
LOG_ERROR("build_row_value_ fail", KR(ret), K(rv), "dml_stmt_task", *dml_stmt_task, K(new_column_cnt),
"compat_mode", print_compat_mode(compat_mode));
} else if (OB_FAIL(build_binlog_record_(br, rv, new_column_cnt, dml_stmt_task->get_dml_type(), table_schema))) {
LOG_ERROR("build_binlog_record_ fail", KR(ret), K(br), K(rv), K(new_column_cnt), KPC(dml_stmt_task));
} else {
if (OB_NOT_NULL(br->get_data()) &&
OB_UNLIKELY(SRC_FULL_RECORDED != br->get_data()->getSrcCategory())) {
// Handling non-full column logging modes: currently not support
handle_non_full_columns_(*dml_stmt_task, *table_schema);
if (skip_dirty_data_) {
ret = OB_SUCCESS;
} else {
// Do not ignore, requires full log, if not full log, exit with an error
ret = OB_NOT_SUPPORTED;
}
} else {
// do nothing
}
}
}
if (stop_flag) {
ret = OB_IN_STOP_STATE;
}
if (OB_SUCC(ret)) {
LOG_DEBUG("formatter handle task", K(thread_index), "stmt_task", *dml_stmt_task);
// Doing the finishing job
// Note: After this function call, neither the partition transaction nor the statement task can be referenced anymore and may be recycled at any time
if (OB_FAIL(finish_format_(stmt_task->get_host(), dml_stmt_task->get_redo_log_entry_task(), stop_flag))) {
if (OB_IN_STOP_STATE != ret) {
LOG_ERROR("finish_format_ fail", KR(ret));
}
}
}
// Failure to withdraw
if (OB_SUCCESS != ret && OB_IN_STOP_STATE != ret && NULL != err_handler_) {
err_handler_->handle_error(ret, "formatter thread exits, thread_index=%ld, err=%d",
thread_index, ret);
stop_flag = true;
}
return ret;
}
int ObLogFormatter::init_binlog_record_for_dml_stmt_task_(DmlStmtTask *stmt_task,
ObLogBR *&br,
bool &is_ignore)
{
int ret = OB_SUCCESS;
is_ignore = false;
ObLogRowDataIndex *row_data_index = NULL;
ObLogEntryTask *log_entry_task = NULL;
bool is_rollback = false;
if (OB_UNLIKELY(! inited_)) {
LOG_ERROR("ObLogFormatter has not been initialized");
ret = OB_NOT_INIT;
} else if (OB_ISNULL(stmt_task)) {
LOG_ERROR("invalid arguments", K(stmt_task));
ret = OB_INVALID_ARGUMENT;
} else if (OB_ISNULL(row_data_index = &(stmt_task->get_row_data_index()))) {
LOG_ERROR("row_data_index is NULL", KPC(stmt_task));
ret = OB_INVALID_ARGUMENT;
} else if (OB_ISNULL(log_entry_task = &(stmt_task->get_redo_log_entry_task()))) {
LOG_ERROR("log_entry_task is NULL", KPC(stmt_task));
ret = OB_INVALID_ARGUMENT;
} else if (OB_FAIL(br_pool_->alloc(false/*is_serilized*/, br, row_data_index, log_entry_task))) {
LOG_ERROR("alloc binlog record from pool fail", KR(ret), K(stmt_task));
} else if (OB_ISNULL(br)) {
LOG_ERROR("alloc binlog record fail", K(br));
ret = OB_ERR_UNEXPECTED;
} else {
is_rollback = row_data_index->is_rollback();
// select ... for update to record T_DML_LOCK log to prevent loss of row lock information on the standby machine in the event of a master/standby switchover, no synchronization required
if (T_DML_LOCK == stmt_task->get_dml_type()) {
is_ignore = true;
} else if (is_rollback) {
is_ignore = true;
} else {
RecordType type = get_record_type(stmt_task->get_dml_type());
const uint64_t tenant_id = extract_tenant_id(stmt_task->get_host().get_partition().get_table_id());
if (OB_FAIL(br->init_dml_data_first(type, tenant_id))) {
LOG_ERROR("br init_dml_data_first fail", KR(ret), K(type), K(tenant_id), K(*stmt_task));
} else {
LOG_DEBUG("br init_dml_data succ", KR(ret), K(type), K(tenant_id), K(stmt_task), K(*stmt_task));
}
}
if (OB_SUCC(ret)) {
row_data_index->set_binlog_record(br);
}
}
if (OB_FAIL(ret)) {
if (NULL != br) {
br_pool_->free(br);
br = NULL;
}
}
return ret;
}
void ObLogFormatter::handle_non_full_columns_(DmlStmtTask &dml_stmt_task,
const TableSchemaType &table_schema)
{
PartTransTask &task = dml_stmt_task.get_host();
if (! skip_dirty_data_) {
LOG_ERROR("row data is not full recorded",
"pkey", task.get_partition(),
"prepare_log_id", task.get_prepare_log_id(),
"timestamp", task.get_timestamp(),
"dml_type", dml_stmt_task.get_dml_type(),
"dml_type_str", print_dml_type(dml_stmt_task.get_dml_type()),
"table_name", table_schema.get_table_name(),
"table_id", table_schema.get_table_id(),
K(dml_stmt_task));
}
}
int ObLogFormatter::finish_format_(PartTransTask &part_trans_task,
ObLogEntryTask &redo_log_entry_task,
volatile bool &stop_flag)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(! inited_)) {
ret = OB_NOT_INIT;
} else {
const int64_t stmt_num = redo_log_entry_task.get_stmt_num();
int64_t formatted_stmt_num = redo_log_entry_task.inc_formatted_stmt_num();
const bool is_all_stmt_formatted = formatted_stmt_num >= stmt_num;
const uint64_t tenant_id = part_trans_task.get_tenant_id();
if (is_all_stmt_formatted) {
if (OB_FAIL(redo_log_entry_task.link_row_list())) {
if (OB_IN_STOP_STATE != ret) {
LOG_ERROR("redo_log_entry_task link_row_list fail", KR(ret), K(redo_log_entry_task));
}
} else {
LOG_DEBUG("[FORMATT]", K(tenant_id), K(stmt_num), K(redo_log_entry_task), K(part_trans_task));
if (is_memory_working_mode(working_mode_)) {
if (OB_FAIL(handle_memory_data_sync_work_mode_(part_trans_task, redo_log_entry_task, stop_flag))) {
if (OB_IN_STOP_STATE != ret) {
LOG_ERROR("handle_memory_data_sync_work_mode_ fail", KR(ret), K(part_trans_task), K(redo_log_entry_task));
}
}
} else if (is_storage_working_mode(working_mode_)) {
if (OB_FAIL(handle_storage_data_sync_work_mode_(part_trans_task, redo_log_entry_task, stop_flag))) {
if (OB_IN_STOP_STATE != ret) {
LOG_ERROR("handle_storage_data_sync_work_mode_ fail", KR(ret), K(part_trans_task), K(redo_log_entry_task));
}
}
} else {
ret = OB_NOT_SUPPORTED;
}
}
if (OB_SUCC(ret)) {
ATOMIC_DEC(&log_entry_task_count_);
}
} else {
// do nothing
}
}
return ret;
}
int ObLogFormatter::handle_memory_data_sync_work_mode_(PartTransTask &part_trans_task,
ObLogEntryTask &log_entry_task,
volatile bool &stop_flag)
{
int ret = OB_SUCCESS;
bool is_unserved_part_trans_task_can_be_recycled = false;
if (OB_FAIL(part_trans_task.handle_log_entry_task_callback(ObLogEntryTask::FORMATTER_CB,
log_entry_task,
is_unserved_part_trans_task_can_be_recycled))) {
LOG_ERROR("handle_log_entry_task_callback fail", KR(ret), K(log_entry_task), K(part_trans_task), K(stop_flag));
} else if (is_unserved_part_trans_task_can_be_recycled) {
LOG_DEBUG("handle_log_entry_task_callback: part_trans_task is revert", K(part_trans_task));
part_trans_task.revert();
} else {}
return ret;
}
int ObLogFormatter::handle_storage_data_sync_work_mode_(PartTransTask &part_trans_task,
ObLogEntryTask &redo_log_entry_task,
volatile bool &stop_flag)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(! inited_)) {
LOG_ERROR("ObLogFormatter has not been initialized");
ret = OB_NOT_INIT;
} else if (OB_FAIL(dispatch_to_storager_(redo_log_entry_task, stop_flag))) {
if (OB_IN_STOP_STATE != ret) {
LOG_ERROR("dispatch_to_storager_ fail", KR(ret), K(redo_log_entry_task), K(part_trans_task));
}
} else {
// succ
}
return ret;
}
int ObLogFormatter::dispatch_to_storager_(ObLogEntryTask &log_entry_task,
volatile bool &stop_flag)
{
int ret = OB_SUCCESS;
if (OB_ISNULL(storager_)) {
LOG_ERROR("storager_ is NULL");
ret = OB_ERR_UNEXPECTED;
} else {
RETRY_FUNC(stop_flag, (*storager_), push, log_entry_task, DATA_OP_TIMEOUT);
}
return ret;
}
// @retval OB_SUCCESS success
// @retval OB_TENANT_HAS_BEEN_DROPPED tenant dropped
// #retval other error code fail
int ObLogFormatter::set_meta_info_(ObLogSchemaGuard &schema_guard,
const TableSchemaType *&simple_table_schema,
const DBSchemaInfo &db_schema_info,
ObLogBR *br,
volatile bool &stop_flag)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(! inited_)) {
LOG_ERROR("ObLogFormatter has not been initialized");
ret = OB_NOT_INIT;
} else if (OB_ISNULL(simple_table_schema) || OB_UNLIKELY(! db_schema_info.is_valid()) || OB_ISNULL(br)) {
LOG_ERROR("invalid argument", K(simple_table_schema), K(br), K(db_schema_info));
ret = OB_INVALID_ARGUMENT;
} else if (OB_ISNULL(meta_manager_) || OB_ISNULL(schema_getter_)) {
LOG_ERROR("meta_manager_ or schema_getter_ is null", K(meta_manager_), K(schema_getter_));
ret = OB_ERR_UNEXPECTED;
} else {
IDBMeta *db_meta = NULL;
ITableMeta *table_meta = NULL;
if (OB_FAIL(meta_manager_->get_table_meta(simple_table_schema, *schema_getter_, table_meta, stop_flag))
|| NULL == table_meta) {
if (OB_TENANT_HAS_BEEN_DROPPED == ret) {
LOG_WARN("schema error when get_table_meta, tenant may by dropped", KR(ret),
"table_id", simple_table_schema->get_table_id(),
"table_name", simple_table_schema->get_table_name());
} else if (OB_IN_STOP_STATE != ret) {
LOG_ERROR("get_table_meta fail", KR(ret), "table_id", simple_table_schema->get_table_id(),
"table_name", simple_table_schema->get_table_name(), KPC(simple_table_schema), K(table_meta));
ret = OB_SUCCESS == ret ? OB_ERR_UNEXPECTED : ret;
}
} else if (OB_FAIL(meta_manager_->get_db_meta(db_schema_info, schema_guard, db_meta, stop_flag))
|| NULL == db_meta) {
if (OB_TENANT_HAS_BEEN_DROPPED == ret) {
LOG_WARN("schema error when get_db_meta, tenant may by dropped", KR(ret),
"table_id", simple_table_schema->get_table_id(),
"table_name", simple_table_schema->get_table_name(),
K(db_schema_info));
} else if (OB_IN_STOP_STATE != ret) {
LOG_ERROR("get_db_meta fail", KR(ret),
"table_id", simple_table_schema->get_table_id(),
"table_name", simple_table_schema->get_table_name(),
K(db_schema_info));
ret = OB_SUCCESS == ret ? OB_ERR_UNEXPECTED : ret;
}
} else if (OB_FAIL(br->set_table_meta(table_meta))) {
LOG_ERROR("set_table_meta fail", KR(ret), K(br), K(table_meta));
} else if (OB_FAIL(br->set_db_meta(db_meta))) {
LOG_ERROR("set_db_meta fail", KR(ret), K(br), K(db_meta));
} else {
// success
}
if (OB_SUCCESS != ret) {
if (NULL != table_meta) {
meta_manager_->revert_table_meta(table_meta);
table_meta = NULL;
}
if (NULL != db_meta) {
meta_manager_->revert_db_meta(db_meta);
db_meta = NULL;
}
}
}
return ret;
}
int ObLogFormatter::init_row_value_array_(const int64_t row_value_num)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(row_value_num <= 0)) {
LOG_ERROR("invalid argument", K(row_value_num));
ret = OB_INVALID_ARGUMENT;
} else {
int64_t size = sizeof(RowValue) * row_value_num;
void *ptr = allocator_.alloc(size);
if (NULL == (row_value_array_ = static_cast<RowValue *>(ptr))) {
LOG_ERROR("allocate memory for RowValue fail", K(size), K(row_value_num));
ret = OB_ALLOCATE_MEMORY_FAILED;
} else {
for (int64_t index = 0; index < row_value_num; index++) {
row_value_array_[index].reset();
}
}
}
return ret;
}
void ObLogFormatter::destroy_row_value_array_()
{
if (NULL != row_value_array_) {
allocator_.free(static_cast<void *>(row_value_array_));
row_value_array_ = NULL;
}
}
int ObLogFormatter::build_row_value_(RowValue *rv,
DmlStmtTask *stmt_task,
const TableSchemaType *simple_table_schema,
int64_t &new_column_cnt)
{
int ret = OB_SUCCESS;
ColValueList *rowkey_cols = NULL;
ColValueList *new_cols = NULL;
ColValueList *old_cols = NULL;
int64_t column_num = 0;
TableSchemaInfo *tb_schema_info = NULL;
if (OB_UNLIKELY(! inited_)) {
LOG_ERROR("ObLogFormatter has not been initialized");
ret = OB_NOT_INIT;
} else if (OB_ISNULL(rv) || OB_ISNULL(stmt_task) || OB_ISNULL(simple_table_schema)) {
LOG_ERROR("invalid argument", K(rv), K(stmt_task), K(simple_table_schema));
ret = OB_INVALID_ARGUMENT;
} else if (OB_ISNULL(meta_manager_)) {
LOG_ERROR("meta_manager_ is null", K(meta_manager_));
ret = OB_ERR_UNEXPECTED;
} else if (OB_FAIL(meta_manager_->get_table_schema_meta(simple_table_schema->get_schema_version(),
simple_table_schema->get_table_id(), tb_schema_info))) {
LOG_ERROR("meta_manager_ get_table_schema_meta fail", KR(ret),
"version", simple_table_schema->get_schema_version(),
"table_id", simple_table_schema->get_table_id(),
"table_name", simple_table_schema->get_table_name(), KPC(tb_schema_info));
} else if (OB_ISNULL(tb_schema_info)) {
LOG_ERROR("tb_schema_info is null", K(tb_schema_info));
ret = OB_ERR_UNEXPECTED;
} else {
column_num = tb_schema_info->get_non_hidden_column_count();
if (column_num <= 0) {
LOG_INFO("no valid column is found", "table_name", simple_table_schema->get_table_name(),
"table_id", simple_table_schema->get_table_id());
} else if (OB_FAIL(stmt_task->parse_cols(obj2str_helper_, simple_table_schema, tb_schema_info,
enable_output_hidden_primary_key_))) {
LOG_ERROR("stmt_task.parse_cols fail", KR(ret), K(*stmt_task), K(obj2str_helper_),
KPC(simple_table_schema), KPC(tb_schema_info),
K(enable_output_hidden_primary_key_));
} else if (OB_FAIL(stmt_task->get_cols(&rowkey_cols, &new_cols, &old_cols))) {
LOG_ERROR("get_cols fail", KR(ret), K(*stmt_task));
} else if (OB_ISNULL(rowkey_cols) || OB_ISNULL(new_cols) || OB_ISNULL(old_cols)) {
LOG_ERROR("get_cols fail", K(rowkey_cols), K(new_cols), K(old_cols));
ret = OB_ERR_UNEXPECTED;
}
// NOTE: Logic for determining whether an old value is included: the data in the old value is not empty
else if (OB_FAIL(rv->init(column_num, old_cols->num_ > 0))) {
LOG_ERROR("init RowValue fail", KR(ret), K(column_num));
}
// fill new column value
else if (OB_FAIL(fill_normal_cols_(rv, *new_cols, simple_table_schema, *tb_schema_info, true))) {
LOG_ERROR("fill normal new columns fail", KR(ret), K(rv), KPC(new_cols));
}
// fill old column value
else if (OB_FAIL(fill_normal_cols_(rv, *old_cols, simple_table_schema, *tb_schema_info, false))) {
LOG_ERROR("fill normal old columns fail", KR(ret), K(rv), KPC(old_cols));
} else if (OB_FAIL(fill_rowkey_cols_(rv, *rowkey_cols, simple_table_schema,
*tb_schema_info))) {
LOG_ERROR("fill_rowkey_cols_ fail", KR(ret), K(rv), KPC(rowkey_cols),
"stmt_task", *stmt_task, K(simple_table_schema));
} else if (OB_FAIL(fill_orig_default_value_(rv, simple_table_schema, *tb_schema_info,
stmt_task->get_redo_log_entry_task().get_allocator()))) {
LOG_ERROR("fill_orig_default_value_ fail", KR(ret), K(rv), K(simple_table_schema));
} else {
new_column_cnt = new_cols->num_;
int64_t column_array_size = sizeof(BinLogBuf) * column_num;
BinLogBuf *new_column_array =
static_cast<BinLogBuf *>(stmt_task->get_redo_log_entry_task().alloc(column_array_size));
BinLogBuf *old_column_array =
static_cast<BinLogBuf *>(stmt_task->get_redo_log_entry_task().alloc(column_array_size));
if (OB_ISNULL(new_column_array) || OB_ISNULL(old_column_array)) {
LOG_ERROR("allocate memory for column array fail", K(column_array_size), K(column_num));
ret = OB_ALLOCATE_MEMORY_FAILED;
} else {
rv->new_column_array_ = new_column_array;
rv->old_column_array_ = old_column_array;
}
}
}
return ret;
}
int ObLogFormatter::fill_normal_cols_(RowValue *rv,
ColValueList &cv_list,
const TableSchemaType *simple_table_schema,
const TableSchemaInfo &tb_schema_info,
const bool is_new_value)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(! inited_)) {
LOG_ERROR("ObLogFormatter has not been initialized");
ret = OB_NOT_INIT;
} else if (OB_ISNULL(rv) || OB_ISNULL(simple_table_schema)) {
LOG_ERROR("invalid argument", K(rv), K(simple_table_schema));
ret = OB_INVALID_ARGUMENT;
} else if (OB_ISNULL(meta_manager_)) {
LOG_ERROR("meta_manager_ is null", K(meta_manager_));
ret = OB_ERR_UNEXPECTED;
} else {
ColValue *cv = cv_list.head_;
int64_t table_schema_version = simple_table_schema->get_schema_version();
uint64_t table_id = simple_table_schema->get_table_id();
while (OB_SUCCESS == ret && NULL != cv) {
const uint64_t column_id = cv->column_id_;
ColumnSchemaInfo *column_schema_info = NULL;
int64_t column_index = -1;
ColumnPropertyFlag column_property_flag;
if (OB_FAIL(tb_schema_info.get_column_schema_info(column_id, enable_output_hidden_primary_key_,
column_schema_info, column_property_flag))) {
LOG_ERROR("get_column_schema_info fail", KR(ret), K(table_schema_version), K(table_id),
"table_name", simple_table_schema->get_table_name(),
K(column_id), K(enable_output_hidden_primary_key_),
K(column_schema_info), K(column_property_flag));
} else if (OB_UNLIKELY(column_property_flag.is_non_user())) {
// formatter should not process to non-user columns
LOG_ERROR("handle non user column, unexpected", K(column_property_flag),
"table_id", simple_table_schema->get_table_id(),
"table_name", simple_table_schema->get_table_name(),
K(column_id));
ret = OB_ERR_UNEXPECTED;
// requires that the column must exist and is not a hidden column
// This logic is guaranteed when constructing the column values
} else if (OB_UNLIKELY(column_property_flag.is_delete())
|| OB_UNLIKELY(column_property_flag.is_hidden()
|| OB_UNLIKELY(column_property_flag.is_invisible()))) {
LOG_ERROR("column is invalid. column does not exist or "
"hidden or invisible column is not filtered", K(column_property_flag),
"table", simple_table_schema->get_table_name(),
"column_id", cv->column_id_,
"table_schema_version", simple_table_schema->get_schema_version());
ret = OB_ERR_UNEXPECTED;
} else if (OB_ISNULL(column_schema_info)) {
LOG_ERROR("column_schema_info is null", K(column_schema_info));
ret = OB_ERR_UNEXPECTED;
} else {
column_index = column_schema_info->get_column_idx();
if (OB_UNLIKELY(column_index < 0 || column_index >= OB_MAX_COLUMN_NUMBER)) {
LOG_ERROR("column_index is invalid", "table_name", simple_table_schema->get_table_name(),
K(column_index),
"column_id", cv->column_id_, K(OB_MAX_COLUMN_NUMBER));
ret = OB_ERR_UNEXPECTED;
} else {
if (is_new_value) {
rv->new_columns_[column_index] = &cv->string_value_;
rv->is_changed_[column_index] = true;
} else {
rv->old_columns_[column_index] = &cv->string_value_;
}
}
}
if (OB_SUCCESS == ret) {
cv = cv->next_;
}
} // while
}
return ret;
}
int ObLogFormatter::fill_rowkey_cols_(RowValue *rv,
ColValueList &rowkey_cols,
const TableSchemaType *simple_table_schema,
const TableSchemaInfo &tb_schema_info)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(! inited_)) {
LOG_ERROR("ObLogFormatter has not been initialized");
ret = OB_NOT_INIT;
} else if (OB_ISNULL(rv) || OB_ISNULL(simple_table_schema)) {
LOG_ERROR("invalid argument", K(rv), K(simple_table_schema));
ret = OB_INVALID_ARGUMENT;
} else if (OB_ISNULL(meta_manager_)) {
LOG_ERROR("meta_manager_ is null", K(meta_manager_));
ret = OB_ERR_UNEXPECTED;
} else {
ColValue *cv_node = rowkey_cols.head_;
int64_t rowkey_count = rowkey_cols.num_;
int64_t table_schema_version = simple_table_schema->get_schema_version();
uint64_t table_id = simple_table_schema->get_table_id();
for (int64_t index = 0;
OB_SUCCESS == ret && index < rowkey_count;
index++, cv_node = cv_node->next_) {
uint64_t column_id = cv_node->column_id_;
int64_t column_index = -1;
ColumnSchemaInfo *column_schema_info = NULL;
ColumnPropertyFlag column_property_flag;
if (OB_ISNULL(cv_node)) {
LOG_ERROR("column value node is NULL", K(index), K(rowkey_count), K(cv_node));
ret = OB_INVALID_DATA;
} else if (OB_FAIL(tb_schema_info.get_column_schema_info(column_id, enable_output_hidden_primary_key_,
column_schema_info, column_property_flag))) {
LOG_ERROR("get_column_schema_info fail", KR(ret), K(table_schema_version), K(table_id),
"table_name", simple_table_schema->get_table_name(),
K(column_id), K(enable_output_hidden_primary_key_),
K(column_schema_info), K(column_property_flag));
} else if (OB_UNLIKELY(column_property_flag.is_non_user())) {
// formatter should not be processed to non-user columns
LOG_ERROR("handle non user column, unexpected", K(column_property_flag),
"table_id", simple_table_schema->get_table_id(),
"table_name", simple_table_schema->get_table_name(),
K(column_id));
ret = OB_ERR_UNEXPECTED;
} else if (OB_UNLIKELY(column_property_flag.is_delete())) {
// Do not allow primary keys to not exist
LOG_ERROR("rowkey column does not exist", K(column_property_flag),
"table_id", simple_table_schema->get_table_id(),
"table", simple_table_schema->get_table_name(),
"table_schema_version", simple_table_schema->get_schema_version(),
K(column_id));
ret = OB_ERR_UNEXPECTED;
}
// Hidden primary keys should already be filtered
else if (OB_UNLIKELY(column_property_flag.is_hidden())) {
LOG_ERROR("hidden rowkey column is not filtered", K(column_property_flag),
"table_id", simple_table_schema->get_table_id(),
"table", simple_table_schema->get_table_name(),
"table_schema_version", simple_table_schema->get_schema_version(),
K(column_id));
ret = OB_ERR_UNEXPECTED;
} else if (column_schema_info->is_invisible()) {
// not possible for invisible column
LOG_ERROR("is_invisible column unexpected", "table_id", simple_table_schema->get_table_id(),
"table_name", simple_table_schema->get_table_name(),
"table_schema_version", simple_table_schema->get_schema_version(),
K(column_id));
ret = OB_ERR_UNEXPECTED;
} else if (OB_ISNULL(column_schema_info)) {
LOG_ERROR("column_schema_info is null", K(column_schema_info));
ret = OB_ERR_UNEXPECTED;
} else {
column_index = column_schema_info->get_column_idx();
if (OB_UNLIKELY(column_index < 0 || column_index >= OB_MAX_COLUMN_NUMBER)) {
LOG_ERROR("column_index is invalid", "table_name", simple_table_schema->get_table_name(),
K(column_index), K(column_id));
ret = OB_ERR_UNEXPECTED;
} else {
// If the primary key column has been modified, the value after the modification is used, otherwise the value before the modification is used
if (NULL == rv->new_columns_[column_index]) {
rv->new_columns_[column_index] = &(cv_node->string_value_);
}
rv->is_rowkey_[column_index] = column_schema_info->is_rowkey();
rv->is_changed_[column_index] = true;
if (rv->contain_old_column_ && NULL == rv->old_columns_[column_index]) {
rv->old_columns_[column_index] = &(cv_node->string_value_);
}
}
}
} // for
}
return ret;
}
int ObLogFormatter::fill_orig_default_value_(RowValue *rv,
const TableSchemaType *simple_table_schema,
const TableSchemaInfo &tb_schema_info,
common::ObIAllocator &allocator)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(! inited_)) {
LOG_ERROR("ObLogFormatter has not been initialized");
ret = OB_NOT_INIT;
} else if (OB_ISNULL(rv) || OB_ISNULL(simple_table_schema)) {
LOG_ERROR("invalid argument", K(rv), K(simple_table_schema));
ret = OB_INVALID_ARGUMENT;
} else if (OB_ISNULL(meta_manager_)) {
LOG_ERROR("meta_manager_ is null", K(meta_manager_));
ret = OB_ERR_UNEXPECTED;
} else {
int64_t real_column_index = 0;
int64_t column_count = rv->column_num_;
int64_t table_schema_version = simple_table_schema->get_schema_version();
uint64_t table_id = simple_table_schema->get_table_id();
for (int64_t index = 0; OB_SUCCESS == ret && index < column_count; index++) {
uint64_t column_id = OB_INVALID_ID;
ColumnSchemaInfo *column_schema_info = NULL;
ColumnPropertyFlag column_property_flag;
// 1. where column_count does not contain the number of hidden columns, it is obtained directly from RowValue
// 2. get the column_idx of the specified version of table-column_idx directly from the meta_manager,
// Ensure that the order of the columns in the oblog output is the same as the order of the columns defined in the OB table (add columns at the specified position)
if (OB_FAIL(tb_schema_info.get_column_id(index, column_id))) {
LOG_ERROR("tb_schema_info get_column_id fail", KR(ret), K(index), K(column_id));
} else if (OB_UNLIKELY(OB_INVALID_ID == column_id)) {
LOG_ERROR("column_id is not valid", K(column_id));
ret = OB_ERR_UNEXPECTED;
} else if (OB_FAIL(tb_schema_info.get_column_schema_info(column_id, enable_output_hidden_primary_key_,
column_schema_info, column_property_flag))) {
LOG_ERROR("get_column_schema_info fail", KR(ret), K(index), K(column_count), K(table_schema_version),
K(table_id), "table_name", simple_table_schema->get_table_name(),
K(column_id), K(enable_output_hidden_primary_key_),
K(column_schema_info), K(column_property_flag));
} else if (OB_UNLIKELY(column_property_flag.is_non_user())) {
// formatter should not be processed to non-user columns
LOG_ERROR("handle non user column, unexpected", K(column_property_flag),
"table_id", simple_table_schema->get_table_id(),
"table_name", simple_table_schema->get_table_name(),
"table_schema_version", simple_table_schema->get_schema_version(),
K(column_id));
ret = OB_ERR_UNEXPECTED;
} else if (OB_UNLIKELY(column_property_flag.is_delete())) {
// not possible for delete column
LOG_ERROR("is_delete column unexpected", "table_id", simple_table_schema->get_table_id(),
"table_name", simple_table_schema->get_table_name(),
"table_schema_version", simple_table_schema->get_schema_version(),
K(column_id));
ret = OB_ERR_UNEXPECTED;
} else if (column_schema_info->is_hidden()) {
// not possible for hidden column
LOG_ERROR("is_hidden column unexpected", "table_id", simple_table_schema->get_table_id(),
"table_name", simple_table_schema->get_table_name(),
"table_schema_version", simple_table_schema->get_schema_version(),
K(column_id));
ret = OB_ERR_UNEXPECTED;
} else if (column_schema_info->is_invisible()) {
// not possible for invisible column
LOG_ERROR("is_invisible column unexpected", "table_id", simple_table_schema->get_table_id(),
"table_name", simple_table_schema->get_table_name(),
"table_schema_version", simple_table_schema->get_schema_version(),
K(column_id));
ret = OB_ERR_UNEXPECTED;
} else if (OB_ISNULL(column_schema_info)) {
LOG_ERROR("column_schema_info is null", K(column_schema_info));
ret = OB_ERR_UNEXPECTED;
} else {
// Determine if it is a newly added column, if it is a newly added column, then fill in the original default value
// If neither the new value nor the old value has a value, then it must be a newly added column
if (NULL != rv->new_columns_[real_column_index]
|| NULL != rv->old_columns_[real_column_index]) {
rv->orig_default_value_[real_column_index] = NULL;
} else {
// default vlaue
const common::ObString *orig_default_value_str = column_schema_info->get_orig_default_value_str();
ObString *str = static_cast<ObString *>(allocator.alloc(sizeof(ObString)));
if (OB_ISNULL(str)) {
LOG_ERROR("allocate memory for ObString fail", K(sizeof(ObString)));
ret = OB_ALLOCATE_MEMORY_FAILED;
} else if (OB_ISNULL(orig_default_value_str)) {
LOG_ERROR("orig_default_value_str is null", K(index),
K(table_id), "table_name", simple_table_schema->get_table_name(),
K(column_id), KPC(column_schema_info));
ret = OB_ERR_UNEXPECTED;
// For varchar:
// 1. the default value is NULL, which should be set to NULL
// 2. The default value is an empty string, which should be set to ''
} else if (NULL == orig_default_value_str->ptr()
&& 0 == orig_default_value_str->length()) {
new (str) ObString();
} else if (NULL != orig_default_value_str->ptr()
&& 0 == orig_default_value_str->length()) {
// Empty strings do not require memcpy
new (str) ObString();
str->assign_ptr(ObObj2strHelper::EMPTY_STRING, static_cast<ObString::obstr_size_t>(0));
} else {
const int64_t length = orig_default_value_str->length();
const char *ptr = orig_default_value_str->ptr();
char *ptr_copy = NULL;
if (OB_ISNULL(ptr_copy = static_cast<char *>(allocator.alloc(length)))) {
LOG_ERROR("allocate memory fail", K(length));
ret = OB_ALLOCATE_MEMORY_FAILED;
} else {
MEMCPY(ptr_copy, ptr, length);
new (str) ObString(length, ptr_copy);
}
}
if (OB_SUCC(ret)) {
rv->orig_default_value_[real_column_index] = str;
LOG_DEBUG("cast column orig default value",
"casted", *str,
"table_id", simple_table_schema->get_table_id(),
"table_name", simple_table_schema->get_table_name(),
K(real_column_index), K(index));
}
}
real_column_index++;
}
}
}
return ret;
}
int ObLogFormatter::set_src_category_(ILogRecord *br_data,
RowValue *rv,
const ObRowDml &dml_type,
const bool is_hbase_mode_put)
{
int ret = OB_SUCCESS;
if (OB_ISNULL(br_data) || OB_ISNULL(rv)) {
LOG_ERROR("invalid argument", K(br_data), K(rv));
ret = OB_INVALID_ARGUMENT;
} else {
int src_category = SRC_NO;
// 1. INSERT statements are always set to full column log format
// 2. DELETE and UPDATE must be populated with old values in full column logging mode, so if they are populated with old values, they are in full column logging format
// 3. OB-HBase mode put special handling
if (T_DML_INSERT == dml_type || rv->contain_old_column_ || is_hbase_mode_put) {
src_category = SRC_FULL_RECORDED;
} else {
src_category = SRC_FULL_FAKED;
}
br_data->setSrcCategory(src_category);
}
return ret;
}
int ObLogFormatter::build_binlog_record_(ObLogBR *br,
RowValue *rv,
const int64_t new_column_cnt,
const ObRowDml &dml_type,
const TableSchemaType *simple_table_schema)
{
int ret = OB_SUCCESS;
ILogRecord *br_data = NULL;
bool is_hbase_mode_put = false;
const uint64_t table_id = simple_table_schema->get_table_id();
if (OB_UNLIKELY(! inited_)) {
LOG_ERROR("ObLogFormatter has not been initialized");
ret = OB_NOT_INIT;
} else if (OB_ISNULL(br) || OB_ISNULL(rv) || OB_ISNULL(simple_table_schema)) {
LOG_ERROR("invalid argument", K(br), K(rv), K(simple_table_schema));
ret = OB_INVALID_ARGUMENT;
} else if (OB_ISNULL(br_data = br->get_data())) {
LOG_ERROR("binlog record data is invalid", K(br));
ret = OB_INVALID_ARGUMENT;
} else if (OB_ISNULL(rv->new_column_array_) || OB_ISNULL(rv->old_column_array_)) {
LOG_ERROR("invalid row value, new_column_array or old_column_array is invalid",
K(rv->new_column_array_), K(rv->old_column_array_));
ret = OB_INVALID_ARGUMENT;
} else if (OB_FAIL(is_hbase_mode_put_(table_id, dml_type, rv->column_num_, new_column_cnt,
rv->contain_old_column_, is_hbase_mode_put))) {
LOG_ERROR("is_hbase_mode_put_ fail", KR(ret), K(table_id), "dml_type", print_dml_type(dml_type),
"column_num", rv->column_num_,
K(new_column_cnt),
"contain_old_column", rv->contain_old_column_,
K(is_hbase_mode_put));
} else if (OB_FAIL(set_src_category_(br_data, rv, dml_type, is_hbase_mode_put))) {
LOG_ERROR("set_src_category_ fail", KR(ret), K(br_data), K(rv), K(dml_type), K(is_hbase_mode_put));
} else {
// default to be valid
br->set_is_valid(true);
if (rv->column_num_ <= 0) {
LOG_INFO("ignore non-user-column table", "table_name", simple_table_schema->get_table_name(),
"table_id", simple_table_schema->get_table_id());
// ignore table with no columns
br->set_is_valid(false);
} else {
br_data->setNewColumn(rv->new_column_array_, static_cast<int>(rv->column_num_));
br_data->setOldColumn(rv->old_column_array_, static_cast<int>(rv->column_num_));
ObRowDml current_dml_type = dml_type;
if (is_hbase_mode_put) {
current_dml_type = T_DML_INSERT;
// modify record type
RecordType type = get_record_type(current_dml_type);
if (OB_FAIL(br->setInsertRecordTypeForHBasePut(type))) {
LOG_ERROR("br setInsertRecordTypeForHBasePut fail", KR(ret), K(br),
"type", print_record_type(type),
"dml_type", print_dml_type(dml_type),
"current_dml_type", print_dml_type(current_dml_type),
"table_name", simple_table_schema->get_table_name(),
"table_id", simple_table_schema->get_table_id());
} else {
// succ
}
}
switch (current_dml_type) {
case T_DML_DELETE: {
ret = format_dml_delete_(br_data, rv);
break;
}
case T_DML_INSERT: {
ret = format_dml_insert_(br_data, rv);
break;
}
case T_DML_UPDATE: {
ret = format_dml_update_(br_data, rv);
break;
}
default: {
ret = OB_NOT_SUPPORTED;
LOG_ERROR("unknown DML type, not supported", K(current_dml_type));
break;
}
}
}
}
return ret;
}
int ObLogFormatter::is_hbase_mode_put_(const uint64_t table_id,
const ObRowDml &dml_type,
const int64_t column_number,
const int64_t new_column_cnt,
const bool contain_old_column,
bool &is_hbase_mode_put)
{
int ret = OB_SUCCESS;
is_hbase_mode_put = false;
bool is_hbase_table = false;
if (enable_hbase_mode_) {
if (OB_ISNULL(hbase_util_)) {
LOG_ERROR("hbase_util_ is null", K(hbase_util_));
ret = OB_ERR_UNEXPECTED;
} else if (OB_FAIL(hbase_util_->is_hbase_table(table_id, is_hbase_table))) {
LOG_ERROR("ObLogHbaseUtil is_hbase_table fail", KR(ret), K(table_id), K(is_hbase_table));
} else if (is_hbase_table && T_DML_UPDATE == dml_type && false == contain_old_column) {
if (column_number == new_column_cnt) {
is_hbase_mode_put = true;
} else if (skip_hbase_mode_put_column_count_not_consistency_) {
is_hbase_mode_put = true;
LOG_INFO("skip hbase mode put column count not consistency", K(table_id),
"dml_type", print_dml_type(dml_type),
"hbase_mode_put_column_cnt", new_column_cnt,
K(column_number));
} else {
LOG_ERROR("hbase mode put column cnt is not consistency", K(table_id),
"dml_type", print_dml_type(dml_type),
"hbase_mode_put_column_cnt", new_column_cnt,
K(column_number));
ret = OB_ERR_UNEXPECTED;
}
LOG_DEBUG("[HBASE] [PUT]", K(is_hbase_mode_put), K(table_id),
"dml_type", print_dml_type(dml_type),
K(column_number), K(new_column_cnt), K(contain_old_column));
} else {
// do nothing
}
}
return ret;
}
int ObLogFormatter::format_dml_delete_(ILogRecord *br_data, const RowValue *row_value)
{
int ret = OB_SUCCESS;
if (OB_ISNULL(br_data) || OB_ISNULL(row_value)) {
LOG_ERROR("invalid argument", K(br_data), K(row_value));
ret = OB_INVALID_ARGUMENT;
} else {
for (int64_t i = 0; OB_SUCCESS == ret && i < row_value->column_num_; i++) {
// Handling primary key values
if (row_value->is_rowkey_[i]) {
// The primary key value is taken from the primary key value recorded in the new columns, regardless of whether it is a full column log or not
// The primary key is set by the fill_rowkey_cols_() function, which must be placed in the new column
// DELETE operations use the original primary key value and do not need to use the primary key value from the old value
ObString *str = row_value->new_columns_[i];
if (OB_ISNULL(str)) {
LOG_ERROR("rowkey column is NULL, unexcepted error", K(i), K(row_value->column_num_));
ret = OB_ERR_UNEXPECTED;
} else {
br_data->putOld(str->ptr(), str->length());
}
}
// Handling non-primary key values
else {
if (row_value->contain_old_column_) {
// When full column logging, the non-rowkey column of oldCold is set to the corresponding value
// If the column value is not provided, then it is a new column and the corresponding original default value is set
ObString *str = row_value->old_columns_[i];
if (NULL == str) {
str = row_value->orig_default_value_[i];
}
if (OB_ISNULL(str)) {
LOG_ERROR("old column value and original default value are all invalid",
K(i), "column_num", row_value->column_num_);
ret = OB_ERR_UNEXPECTED;
} else {
br_data->putOld(str->ptr(), str->length());
}
} else {
// Non-rowkey columns of oldCold are set to no-change status for non-full column logging
bool is_changed = false;
if (OB_FAIL(ObLogBR::put_old(br_data, is_changed))) {
LOG_ERROR("put_old fail", KR(ret), K(br_data), K(is_changed));
}
}
}
}
}
return ret;
}
int ObLogFormatter::format_dml_insert_(ILogRecord *br_data, const RowValue *row_value)
{
int ret = OB_SUCCESS;
if (OB_ISNULL(br_data) || OB_ISNULL(row_value)) {
LOG_ERROR("invalid argument", K(br_data), K(row_value));
ret = OB_INVALID_ARGUMENT;
} else {
for (int64_t i = 0; OB_SUCCESS == ret && i < row_value->column_num_; i++) {
if (!row_value->is_changed_[i]) {
ObString *str_val = row_value->orig_default_value_[i];
if (OB_ISNULL(str_val)) {
LOG_ERROR("column original default value is NULL", K(i),
"column_num", row_value->column_num_);
ret = OB_ERR_UNEXPECTED;
} else {
br_data->putNew(str_val->ptr(), str_val->length());
}
} else {
ObString *str_val = row_value->new_columns_[i];
if (OB_ISNULL(str_val)) {
LOG_ERROR("changed column new value is NULL", K(i),
"column_num", row_value->column_num_);
ret = OB_ERR_UNEXPECTED;
} else {
br_data->putNew(str_val->ptr(), str_val->length());
}
}
// FIXME: No old values are populated, regardless of whether it is a full column log
}
}
return ret;
}
int ObLogFormatter::format_dml_update_(ILogRecord *br_data, const RowValue *row_value)
{
int ret = OB_SUCCESS;
if (OB_ISNULL(br_data) || OB_ISNULL(row_value)) {
LOG_ERROR("invalid argument", K(br_data), K(row_value));
ret = OB_INVALID_ARGUMENT;
} else {
for (int i = 0; OB_SUCCESS == ret && i < row_value->column_num_; i++) {
if (! row_value->is_changed_[i]) {
if (row_value->contain_old_column_) {
// In the case of a full column log, for update, if a column is not updated, the new value is filled with the value in old_column
// If there is no corresponding value in the old column either, the original default value is filled
ObString *str_val = row_value->old_columns_[i];
if (NULL == str_val) {
str_val = row_value->orig_default_value_[i];
}
if (OB_ISNULL(str_val)) {
LOG_ERROR("new column value, old column value and original default value "
"are all invalid",
K(i), "column_num", row_value->column_num_);
ret = OB_ERR_UNEXPECTED;
} else {
br_data->putNew(str_val->ptr(), str_val->length());
}
} else {
// Mark as unmodified when not a full column log
br_data->putNew(NULL, 0);
}
} else {
ObString *str_val = row_value->new_columns_[i];
if (OB_ISNULL(str_val)) {
LOG_ERROR("changed column new value is NULL", K(i),
"column_num", row_value->column_num_);
ret = OB_ERR_UNEXPECTED;
} else {
br_data->putNew(str_val->ptr(), str_val->length());
}
}
if (OB_SUCCESS == ret) {
if (row_value->contain_old_column_) {
// For full column logging, the old value is always filled with the value in old_column for updates
// If there is no valid value in the old column, the original default value is filled
ObString *str_val = row_value->old_columns_[i];
if (NULL == str_val) {
str_val = row_value->orig_default_value_[i];
}
if (OB_ISNULL(str_val)) {
LOG_ERROR("old column value and original default value are all invalid",
K(i), "column_num", row_value->column_num_);
ret = OB_ERR_UNEXPECTED;
} else {
br_data->putOld(str_val->ptr(), str_val->length());
}
} else {
// When not full column logging, for update, the old value is filled with whether the corresponding column has been modified
bool is_changed = row_value->is_changed_[i];
if (row_value->is_rowkey_[i]) {
is_changed = true;
}
if (OB_FAIL(ObLogBR::put_old(br_data, is_changed))) {
LOG_ERROR("put_old fail", KR(ret), K(br_data), K(is_changed));
}
}
}
} // end of for
}
return ret;
}
int ObLogFormatter::get_schema_(IObLogSchemaGetter *schema_getter,
const int64_t version,
const uint64_t table_id,
volatile bool &stop_flag,
ObLogSchemaGuard &schema_guard,
const TableSchemaType *&table_schema,
DBSchemaInfo &db_schema_info)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(! inited_)) {
LOG_ERROR("ObLogFormatter has not been initialized");
ret = OB_NOT_INIT;
} else if (OB_ISNULL(schema_getter) || OB_UNLIKELY(version <= 0)) {
LOG_ERROR("invalid argument", K(schema_getter), K(version));
ret = OB_INVALID_ARGUMENT;
} else {
int64_t refreshed_version = version;
const uint64_t pure_tb_id = extract_pure_id(table_id);
const uint64_t tenant_id = extract_tenant_id(table_id);
if (OB_ALL_SEQUENCE_VALUE_TID == pure_tb_id) {
ObLogTenantGuard guard;
ObLogTenant *tenant = NULL;
if (OB_FAIL(TCTX.get_tenant_guard(tenant_id, guard))) {
LOG_ERROR("get tenant fail", KR(ret), K(tenant_id));
} else if (OB_ISNULL(tenant = guard.get_tenant())) {
LOG_ERROR("invalid tenant", K(guard), K(tenant));
ret = OB_ERR_UNEXPECTED;
} else {
const int64_t tenant_start_schema_version = tenant->get_start_schema_version();
refreshed_version = max(version, tenant_start_schema_version);
}
}
// get schema guard
RETRY_FUNC(stop_flag, (*schema_getter), get_schema_guard_and_table_schema,
table_id,
refreshed_version,
GET_SCHEMA_TIMEOUT,
schema_guard,
table_schema);
if (OB_SUCCESS == ret && NULL != table_schema) {
uint64_t db_id = table_schema->get_database_id();
// Get database schema information, including name and version
RETRY_FUNC(stop_flag, schema_guard, get_database_schema_info, db_id, db_schema_info,
GET_SCHEMA_TIMEOUT);
}
}
return ret;
}
} // namespace liboblog
} // namespace oceanbase