patch 4.0

This commit is contained in:
wangzelin.wzl
2022-10-24 10:34:53 +08:00
parent 4ad6e00ec3
commit 93a1074b0c
10533 changed files with 2588271 additions and 2299373 deletions

View File

@ -10,7 +10,7 @@
* See the Mulan PubL v2 for more details.
*/
#define USING_LOG_PREFIX SQL_ENG
#define USING_LOG_PREFIX SQL_ENG
#include "sql/engine/cmd/ob_load_data_utils.h"
#include "sql/resolver/cmd/ob_load_data_stmt.h"
@ -20,46 +20,48 @@ namespace oceanbase {
using namespace common;
namespace sql {
const char* ObLoadDataUtils::NULL_STRING = "NULL";
const char *ObLoadDataUtils::NULL_STRING = "NULL";
const char ObLoadDataUtils::NULL_VALUE_FLAG = '\xff';
int ObLoadDataUtils::build_insert_sql_string_head(ObLoadDupActionType insert_mode, const ObString& table_name,
const ObIArray<ObString>& insert_keys, ObSqlString& insertsql_keys)
int ObLoadDataUtils::build_insert_sql_string_head(ObLoadDupActionType insert_mode,
const ObString &table_name,
const ObIArray<ObString> &insert_keys,
ObSqlString &insertsql_keys)
{
int ret = OB_SUCCESS;
static const char* replace_stmt = "replace into ";
static const char* insert_stmt = "insert into ";
static const char* insert_ignore_stmt = "insert ignore into ";
static const char *replace_stmt = "replace into ";
static const char *insert_stmt = "insert into ";
static const char *insert_ignore_stmt = "insert ignore into ";
const char* stmt_head = NULL;
const char *stmt_head = NULL;
switch (insert_mode) {
case ObLoadDupActionType::LOAD_REPLACE:
stmt_head = replace_stmt;
break;
case ObLoadDupActionType::LOAD_IGNORE:
stmt_head = insert_ignore_stmt;
break;
case ObLoadDupActionType::LOAD_STOP_ON_DUP:
stmt_head = insert_stmt;
break;
default:
ret = OB_NOT_SUPPORTED;
LOG_WARN("not suppport insert mode", K(insert_mode));
case ObLoadDupActionType::LOAD_REPLACE:
stmt_head = replace_stmt;
break;
case ObLoadDupActionType::LOAD_IGNORE:
stmt_head = insert_ignore_stmt;
break;
case ObLoadDupActionType::LOAD_STOP_ON_DUP:
stmt_head = insert_stmt;
break;
default:
ret = OB_NOT_SUPPORTED;
LOG_WARN("not suppport insert mode", K(insert_mode));
}
insertsql_keys.reuse();
OZ(insertsql_keys.reserve(OB_MEDIUM_SQL_LENGTH));
OZ(insertsql_keys.assign(stmt_head));
OZ(insertsql_keys.append(table_name));
OZ(insertsql_keys.append("("));
OZ (insertsql_keys.reserve(OB_MEDIUM_SQL_LENGTH));
OZ (insertsql_keys.assign(stmt_head));
OZ (insertsql_keys.append(table_name));
OZ (insertsql_keys.append("("));
for (int64_t i = 0; i < insert_keys.count(); ++i) {
if (i != 0) {
OZ(insertsql_keys.append(","));
OZ (insertsql_keys.append(","));
}
OZ(insertsql_keys.append_fmt(
share::is_oracle_mode() ? "\"%.*s\"" : "`%.*s`", insert_keys.at(i).length(), insert_keys.at(i).ptr()));
OZ (insertsql_keys.append_fmt(lib::is_oracle_mode() ? "\"%.*s\"" : "`%.*s`",
insert_keys.at(i).length(), insert_keys.at(i).ptr()));
}
OZ(insertsql_keys.append(")"));
OZ (insertsql_keys.append(")"));
if (OB_FAIL(ret)) {
LOG_WARN("append failed", K(ret), K(insertsql_keys.length()));
@ -68,24 +70,33 @@ int ObLoadDataUtils::build_insert_sql_string_head(ObLoadDupActionType insert_mod
return ret;
}
int ObLoadDataUtils::append_values_in_remote_process(int64_t table_column_count, int64_t append_values_count,
const ObExprValueBitSet& expr_bitset, const ObIArray<ObString>& insert_values, ObSqlString& insertsql,
ObDataBuffer& data_buffer, int64_t skipped_row_count)
int ObLoadDataUtils::append_values_in_remote_process(int64_t table_column_count,
int64_t append_values_count,
const ObExprValueBitSet &expr_bitset,
const ObIArray<ObString> &insert_values,
ObSqlString &insertsql,
ObDataBuffer &data_buffer,
int64_t skipped_row_count)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(!insertsql.is_valid()) ||
OB_UNLIKELY(append_values_count + skipped_row_count * table_column_count > insert_values.count()) ||
OB_UNLIKELY(0 == table_column_count)) {
if (OB_UNLIKELY(!insertsql.is_valid())
|| OB_UNLIKELY(append_values_count + skipped_row_count * table_column_count > insert_values.count())
|| OB_UNLIKELY(0 == table_column_count)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("insert values are invalid", K(ret), K(insertsql), K(append_values_count), K(insert_values.count()));
} else {
int64_t row_count = append_values_count / table_column_count;
int64_t row_count = append_values_count/table_column_count;
if (OB_FAIL(insertsql.append(" values "))) {
LOG_WARN("append failed", K(ret), K(insertsql.length()));
}
for (int64_t row_idx = 0; OB_SUCC(ret) && row_idx < row_count; ++row_idx) {
if (OB_FAIL(append_values_for_one_row(
table_column_count, expr_bitset, insert_values, insertsql, data_buffer, row_idx + skipped_row_count))) {
if (OB_FAIL(append_values_for_one_row(table_column_count,
expr_bitset,
insert_values,
insertsql,
data_buffer,
row_idx + skipped_row_count))) {
LOG_WARN("append values for one row in remote process failed", K(ret));
} else {
if (row_idx + 1 != row_count) {
@ -99,9 +110,13 @@ int ObLoadDataUtils::append_values_in_remote_process(int64_t table_column_count,
return ret;
}
int ObLoadDataUtils::append_values_for_one_row(const int64_t table_column_count,
const ObExprValueBitSet& expr_value_bitset, const ObIArray<ObString>& insert_values, ObSqlString& insertsql,
ObDataBuffer& data_buffer, const int64_t skipped_row_count)
const ObExprValueBitSet &expr_value_bitset,
const ObIArray<ObString> &insert_values,
ObSqlString &insertsql,
ObDataBuffer &data_buffer,
const int64_t skipped_row_count)
{
int ret = OB_SUCCESS;
int64_t value_offset = skipped_row_count * table_column_count;
@ -116,7 +131,7 @@ int ObLoadDataUtils::append_values_for_one_row(const int64_t table_column_count,
}
}
for (int64_t i = 0; OB_SUCC(ret) && i < table_column_count; ++i) {
const ObString& value = insert_values.at(i + value_offset);
const ObString &value = insert_values.at(i + value_offset);
bool is_expr_value = expr_value_bitset.has_member(i);
ObString cur_column_str;
if (!is_expr_value) {
@ -144,7 +159,7 @@ int ObLoadDataUtils::append_values_for_one_row(const int64_t table_column_count,
return ret;
}
int ObLoadDataUtils::append_value(const ObString& cur_column_str, ObSqlString& sqlstr_values, bool is_expr_value)
int ObLoadDataUtils::append_value(const ObString &cur_column_str, ObSqlString &sqlstr_values, bool is_expr_value)
{
int ret = OB_SUCCESS;
if (!is_expr_value) {
@ -165,9 +180,13 @@ int ObLoadDataUtils::append_value(const ObString& cur_column_str, ObSqlString& s
return ret;
}
int ObLoadDataUtils::append_values_in_local_process(const int64_t key_columns, const int64_t values_count,
const ObIArray<ObString>& insert_values, const ObExprValueBitSet& expr_value_bitset, ObSqlString& insertsql,
ObDataBuffer& data_buffer)
int ObLoadDataUtils::append_values_in_local_process(const int64_t key_columns,
const int64_t values_count,
const ObIArray<ObString> &insert_values,
const ObExprValueBitSet &expr_value_bitset,
ObSqlString &insertsql,
ObDataBuffer &data_buffer)
{
int ret = OB_SUCCESS;
if (!insertsql.is_valid() || values_count > insert_values.count() || key_columns != values_count) {
@ -176,25 +195,29 @@ int ObLoadDataUtils::append_values_in_local_process(const int64_t key_columns, c
} else {
if (OB_FAIL(insertsql.append(" values "))) {
LOG_WARN("append failed", K(ret), K(insertsql.length()));
} else if (OB_FAIL(
append_values_for_one_row(values_count, expr_value_bitset, insert_values, insertsql, data_buffer))) {
} else if (OB_FAIL(append_values_for_one_row(values_count,
expr_value_bitset,
insert_values,
insertsql,
data_buffer))) {
LOG_WARN("append values for one row in local process failed", K(ret));
}
}
return ret;
}
ObString ObLoadDataUtils::escape_quotation(const ObString& value, ObDataBuffer& data_buf)
ObString ObLoadDataUtils::escape_quotation(const ObString &value, ObDataBuffer &data_buf)
{
char* buf = data_buf.get_data();
char *buf = data_buf.get_data();
ObString result;
if (OB_ISNULL(buf)) {
LOG_WARN("data buf is not inited");
} else {
// check if escape is needed
//check if escape is needed
bool need_escape = false;
const char* src = value.ptr();
const char *src = value.ptr();
int64_t str_len = value.length();
ObLoadEscapeSM escape_sm;
escape_sm.set_escape_char(ObLoadEscapeSM::ESCAPE_CHAR_MYSQL);
@ -212,14 +235,14 @@ ObString ObLoadDataUtils::escape_quotation(const ObString& value, ObDataBuffer&
escape_sm.reset();
for (int64_t i = 0; i < str_len && pos < data_buf.get_capacity(); ++i) {
if (*(src + i) == '\'' && !escape_sm.is_escaping()) {
buf[pos++] = static_cast<char>(
share::is_oracle_mode() ? ObLoadEscapeSM::ESCAPE_CHAR_ORACLE : ObLoadEscapeSM::ESCAPE_CHAR_MYSQL);
buf[pos++] = static_cast<char>(lib::is_oracle_mode() ?
ObLoadEscapeSM::ESCAPE_CHAR_ORACLE : ObLoadEscapeSM::ESCAPE_CHAR_MYSQL);
}
buf[pos++] = src[i];
escape_sm.shift_by_input(*(src + i));
}
if (OB_UNLIKELY(pos >= data_buf.get_capacity())) {
LOG_ERROR("data is too long"); // this should never happened, just for protection
LOG_ERROR("data is too long"); //this should never happened, just for protection
result.reset();
} else {
result.assign_ptr(buf, static_cast<int32_t>(pos));
@ -230,7 +253,7 @@ ObString ObLoadDataUtils::escape_quotation(const ObString& value, ObDataBuffer&
return result;
}
int ObLoadDataUtils::init_empty_string_array(ObIArray<ObString>& new_array, int64_t array_size)
int ObLoadDataUtils::init_empty_string_array(ObIArray<ObString> &new_array, int64_t array_size)
{
int ret = OB_SUCCESS;
new_array.reset();
@ -242,13 +265,13 @@ int ObLoadDataUtils::init_empty_string_array(ObIArray<ObString>& new_array, int6
return ret;
}
bool ObKMPStateMachine::scan_buf(char*& cur_pos, const char* buf_end)
bool ObKMPStateMachine::scan_buf(char *&cur_pos, const char *buf_end)
{
bool matched = false;
if (OB_UNLIKELY(!is_inited_ || NULL == cur_pos)) {
LOG_ERROR("ObKmpStateMachine not inited.", K(cur_pos), K(buf_end));
} else {
for (; !matched && cur_pos < buf_end; cur_pos++) {
for (;!matched && cur_pos < buf_end; cur_pos++) {
while (matched_pos_ > 0 && *cur_pos != str_[matched_pos_]) {
matched_pos_ = next_[matched_pos_];
}
@ -264,11 +287,11 @@ bool ObKMPStateMachine::scan_buf(char*& cur_pos, const char* buf_end)
return matched;
}
int ObKMPStateMachine::init(ObIAllocator& allocator, const ObString& str)
int ObKMPStateMachine::init(ObIAllocator &allocator, const ObString &str)
{
int ret = OB_SUCCESS;
void* next_buff = NULL;
void* str_buff = NULL;
void *next_buff = NULL;
void *str_buff = NULL;
int32_t str_len = str.length();
if (OB_UNLIKELY(is_inited_)) {
ret = OB_INIT_TWICE;
@ -285,15 +308,15 @@ int ObKMPStateMachine::init(ObIAllocator& allocator, const ObString& str)
} else {
str_len_ = str_len;
next_ = static_cast<int32_t*>(next_buff);
str_ = static_cast<char*>(str_buff);
// copy string
str_ = static_cast<char *>(str_buff);
//copy string
MEMCPY(str_, str.ptr(), str.length());
matched_pos_ = 0;
// calc kmp next arr
//calc kmp next arr
int32_t k = 0;
next_[0] = 0;
for (int64_t i = 1; i < str_len_; ++i) {
while (k > 0 && str_[k] != str_[i]) {
while(k > 0 && str_[k] != str_[i]) {
k = next_[k];
}
if (str_[k] == str_[i]) {
@ -301,7 +324,7 @@ int ObKMPStateMachine::init(ObIAllocator& allocator, const ObString& str)
}
next_[i] = k;
}
// check error
//check error
for (int64_t i = 0; OB_SUCC(ret) && i < str_len_; ++i) {
if (OB_UNLIKELY(next_[i] < 0) || OB_UNLIKELY(next_[i] >= str_len_)) {
ret = OB_ERR_UNEXPECTED;
@ -315,8 +338,7 @@ int ObKMPStateMachine::init(ObIAllocator& allocator, const ObString& str)
return ret;
}
int ObLoadDataUtils::check_session_status(ObSQLSessionInfo& session, int64_t reserved_us)
{
int ObLoadDataUtils::check_session_status(ObSQLSessionInfo &session, int64_t reserved_us) {
int ret = OB_SUCCESS;
bool is_timeout = false;
int64_t query_timeout = 0;
@ -326,24 +348,19 @@ int ObLoadDataUtils::check_session_status(ObSQLSessionInfo& session, int64_t res
if (OB_FAIL(session.get_query_timeout(query_timeout))) {
LOG_WARN("fail to get query timeout", K(ret));
} else if (OB_FAIL(session.is_timeout(is_timeout))) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("get session timeout info failed", K(ret));
} else if (OB_UNLIKELY(query_start_time + query_timeout < current_time + reserved_us)) {
} else if (OB_UNLIKELY(query_start_time + query_timeout
< current_time + reserved_us)) {
ret = OB_TIMEOUT;
LOG_WARN("query is timeout", K(ret));
} else if (OB_UNLIKELY(is_timeout)) {
ret = OB_TIMEOUT;
LOG_WARN("session is timeout", K(ret));
} else if (OB_UNLIKELY(session.is_query_killed())) {
ret = OB_ERR_QUERY_INTERRUPTED;
LOG_WARN("query is killed", K(ret));
} else if (OB_UNLIKELY(session.is_zombie())) {
ret = OB_SESSION_KILLED;
LOG_WARN("session is killed", K(ret));
} else if (OB_FAIL(session.check_session_status())) {
LOG_WARN("session's state is not OB_SUCCESS", K(ret));
}
if (OB_FAIL(ret)) {
LOG_WARN(
"LOAD DATA timeout", K(ret), K(session.get_sessid()), K(query_timeout), K(query_start_time), K(current_time));
LOG_WARN("LOAD DATA timeout", K(ret), K(session.get_sessid()), K(query_timeout), K(query_start_time), K(current_time));
}
return ret;
}
@ -353,7 +370,9 @@ int ObGlobalLoadDataStatMap::init()
int ret = OB_SUCCESS;
if (IS_INIT) {
ret = OB_INIT_TWICE;
} else if (OB_FAIL(map_.create(bucket_num, ObModIds::OB_SQL_LOAD_DATA, ObModIds::OB_SQL_LOAD_DATA))) {
} else if (OB_FAIL(map_.create(bucket_num,
ObModIds::OB_SQL_LOAD_DATA,
ObModIds::OB_SQL_LOAD_DATA))) {
ret = OB_ALLOCATE_MEMORY_FAILED;
LOG_WARN("create hash table failed", K(ret));
} else {
@ -362,43 +381,104 @@ int ObGlobalLoadDataStatMap::init()
return ret;
}
int ObGlobalLoadDataStatMap::register_job(const ObLoadDataGID& id, ObLoadDataStat* job_status)
int ObGlobalLoadDataStatMap::register_job(const ObLoadDataGID &id, ObLoadDataStat *job_status)
{
int ret = OB_SUCCESS;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
}
OZ(map_.set_refactored(id, job_status));
OZ (map_.set_refactored(id, job_status));
return ret;
}
int ObGlobalLoadDataStatMap::unregister_job(const ObLoadDataGID& id, ObLoadDataStat*& job_status)
int ObGlobalLoadDataStatMap::unregister_job(const ObLoadDataGID &id, ObLoadDataStat *&job_status)
{
int ret = OB_SUCCESS;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
}
OZ(map_.erase_refactored(id, &job_status));
OZ (map_.erase_refactored(id, &job_status));
return ret;
}
int ObGlobalLoadDataStatMap::get_job_status(const ObLoadDataGID& id, ObLoadDataStat*& job_status)
int ObGlobalLoadDataStatMap::get_job_status(const ObLoadDataGID &id, ObLoadDataStat *&job_status)
{
int ret = OB_SUCCESS;
auto get_and_add_ref = [&](hash::HashMapPair<ObLoadDataGID, ObLoadDataStat*>& entry) -> void {
auto get_and_add_ref = [&](hash::HashMapPair<ObLoadDataGID, ObLoadDataStat*> &entry) -> void
{
entry.second->aquire();
job_status = entry.second;
};
OZ(map_.read_atomic(id, get_and_add_ref));
OZ (map_.read_atomic(id, get_and_add_ref));
return ret;
}
ObGlobalLoadDataStatMap* ObGlobalLoadDataStatMap::getInstance()
int ObGlobalLoadDataStatMap::get_all_job_status(ObGetAllJobStatusOp &job_status_op)
{
int ret = OB_SUCCESS;
OZ (map_.foreach_refactored(job_status_op));
return ret;
}
ObGetAllJobStatusOp::ObGetAllJobStatusOp()
: job_status_array_(),
current_job_index_(0)
{
}
ObGetAllJobStatusOp::~ObGetAllJobStatusOp()
{
reset();
}
void ObGetAllJobStatusOp::reset()
{
ObLoadDataStat *job_status;
for (int i = 0; i < job_status_array_.count(); i++) {
job_status = job_status_array_.at(i);
job_status->release();
}
job_status_array_.reset();
current_job_index_ = 0;
}
int ObGetAllJobStatusOp::operator()(common::hash::HashMapPair<ObLoadDataGID, ObLoadDataStat *> &entry)
{
int ret = OB_SUCCESS;
entry.second->aquire();
if (OB_FAIL(job_status_array_.push_back(entry.second))) {
entry.second->release();
LOG_WARN("push_back ObLoadDataStat failed", K(ret));
}
return ret;
}
ObLoadDataStat* ObGetAllJobStatusOp::next_job_status()
{
ObLoadDataStat *job_status = nullptr;
if (current_job_index_ < job_status_array_.count()) {
job_status = job_status_array_.at(current_job_index_++);
}
return job_status;
}
bool ObGetAllJobStatusOp::end()
{
return (current_job_index_ >= job_status_array_.count());
}
ObGlobalLoadDataStatMap *ObGlobalLoadDataStatMap::getInstance()
{
return instance_;
}
ObGlobalLoadDataStatMap* ObGlobalLoadDataStatMap::instance_ = new ObGlobalLoadDataStatMap();
ObGlobalLoadDataStatMap *ObGlobalLoadDataStatMap::instance_ = new ObGlobalLoadDataStatMap();
volatile int64_t ObLoadDataGID::GlobalLoadDataID = 0;
@ -406,5 +486,8 @@ OB_SERIALIZE_MEMBER(ObLoadTaskStatus, task_status_);
OB_SERIALIZE_MEMBER(ObLoadDataGID, id);
} // namespace sql
} // namespace oceanbase
}
}