init push
This commit is contained in:
410
src/sql/engine/cmd/ob_load_data_utils.cpp
Normal file
410
src/sql/engine/cmd/ob_load_data_utils.cpp
Normal file
@ -0,0 +1,410 @@
|
||||
/**
|
||||
* Copyright (c) 2021 OceanBase
|
||||
* OceanBase CE is licensed under Mulan PubL v2.
|
||||
* You can use this software according to the terms and conditions of the Mulan PubL v2.
|
||||
* You may obtain a copy of Mulan PubL v2 at:
|
||||
* http://license.coscl.org.cn/MulanPubL-2.0
|
||||
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
|
||||
* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
|
||||
* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
|
||||
* See the Mulan PubL v2 for more details.
|
||||
*/
|
||||
|
||||
#define USING_LOG_PREFIX SQL_ENG
|
||||
|
||||
#include "sql/engine/cmd/ob_load_data_utils.h"
|
||||
#include "sql/resolver/cmd/ob_load_data_stmt.h"
|
||||
#include "sql/session/ob_sql_session_info.h"
|
||||
|
||||
namespace oceanbase {
|
||||
using namespace common;
|
||||
namespace sql {
|
||||
|
||||
const char* ObLoadDataUtils::NULL_STRING = "NULL";
|
||||
const char ObLoadDataUtils::NULL_VALUE_FLAG = '\xff';
|
||||
|
||||
int ObLoadDataUtils::build_insert_sql_string_head(ObLoadDupActionType insert_mode, const ObString& table_name,
|
||||
const ObIArray<ObString>& insert_keys, ObSqlString& insertsql_keys)
|
||||
{
|
||||
int ret = OB_SUCCESS;
|
||||
static const char* replace_stmt = "replace into ";
|
||||
static const char* insert_stmt = "insert into ";
|
||||
static const char* insert_ignore_stmt = "insert ignore into ";
|
||||
|
||||
const char* stmt_head = NULL;
|
||||
switch (insert_mode) {
|
||||
case ObLoadDupActionType::LOAD_REPLACE:
|
||||
stmt_head = replace_stmt;
|
||||
break;
|
||||
case ObLoadDupActionType::LOAD_IGNORE:
|
||||
stmt_head = insert_ignore_stmt;
|
||||
break;
|
||||
case ObLoadDupActionType::LOAD_STOP_ON_DUP:
|
||||
stmt_head = insert_stmt;
|
||||
break;
|
||||
default:
|
||||
ret = OB_NOT_SUPPORTED;
|
||||
LOG_WARN("not suppport insert mode", K(insert_mode));
|
||||
}
|
||||
|
||||
insertsql_keys.reuse();
|
||||
OZ(insertsql_keys.reserve(OB_MEDIUM_SQL_LENGTH));
|
||||
OZ(insertsql_keys.assign(stmt_head));
|
||||
OZ(insertsql_keys.append(table_name));
|
||||
OZ(insertsql_keys.append("("));
|
||||
for (int64_t i = 0; i < insert_keys.count(); ++i) {
|
||||
if (i != 0) {
|
||||
OZ(insertsql_keys.append(","));
|
||||
}
|
||||
OZ(insertsql_keys.append_fmt(
|
||||
share::is_oracle_mode() ? "\"%.*s\"" : "`%.*s`", insert_keys.at(i).length(), insert_keys.at(i).ptr()));
|
||||
}
|
||||
OZ(insertsql_keys.append(")"));
|
||||
|
||||
if (OB_FAIL(ret)) {
|
||||
LOG_WARN("append failed", K(ret), K(insertsql_keys.length()));
|
||||
}
|
||||
|
||||
return ret;
|
||||
}
|
||||
|
||||
int ObLoadDataUtils::append_values_in_remote_process(int64_t table_column_count, int64_t append_values_count,
|
||||
const ObExprValueBitSet& expr_bitset, const ObIArray<ObString>& insert_values, ObSqlString& insertsql,
|
||||
ObDataBuffer& data_buffer, int64_t skipped_row_count)
|
||||
{
|
||||
int ret = OB_SUCCESS;
|
||||
if (OB_UNLIKELY(!insertsql.is_valid()) ||
|
||||
OB_UNLIKELY(append_values_count + skipped_row_count * table_column_count > insert_values.count()) ||
|
||||
OB_UNLIKELY(0 == table_column_count)) {
|
||||
ret = OB_INVALID_ARGUMENT;
|
||||
LOG_WARN("insert values are invalid", K(ret), K(insertsql), K(append_values_count), K(insert_values.count()));
|
||||
} else {
|
||||
int64_t row_count = append_values_count / table_column_count;
|
||||
if (OB_FAIL(insertsql.append(" values "))) {
|
||||
LOG_WARN("append failed", K(ret), K(insertsql.length()));
|
||||
}
|
||||
for (int64_t row_idx = 0; OB_SUCC(ret) && row_idx < row_count; ++row_idx) {
|
||||
if (OB_FAIL(append_values_for_one_row(
|
||||
table_column_count, expr_bitset, insert_values, insertsql, data_buffer, row_idx + skipped_row_count))) {
|
||||
LOG_WARN("append values for one row in remote process failed", K(ret));
|
||||
} else {
|
||||
if (row_idx + 1 != row_count) {
|
||||
if (OB_FAIL(insertsql.append(","))) {
|
||||
LOG_WARN("append failed", K(ret), K(insertsql.length()));
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
return ret;
|
||||
}
|
||||
|
||||
int ObLoadDataUtils::append_values_for_one_row(const int64_t table_column_count,
|
||||
const ObExprValueBitSet& expr_value_bitset, const ObIArray<ObString>& insert_values, ObSqlString& insertsql,
|
||||
ObDataBuffer& data_buffer, const int64_t skipped_row_count)
|
||||
{
|
||||
int ret = OB_SUCCESS;
|
||||
int64_t value_offset = skipped_row_count * table_column_count;
|
||||
|
||||
if (OB_UNLIKELY(skipped_row_count * table_column_count + table_column_count > insert_values.count())) {
|
||||
ret = OB_INVALID_ARGUMENT;
|
||||
LOG_WARN("invalid argument", K(skipped_row_count), K(table_column_count), K(insert_values.count()));
|
||||
}
|
||||
if (OB_SUCC(ret)) {
|
||||
if (OB_FAIL(insertsql.append("("))) {
|
||||
LOG_WARN("append failed", K(ret), K(insertsql.length()));
|
||||
}
|
||||
}
|
||||
for (int64_t i = 0; OB_SUCC(ret) && i < table_column_count; ++i) {
|
||||
const ObString& value = insert_values.at(i + value_offset);
|
||||
bool is_expr_value = expr_value_bitset.has_member(i);
|
||||
ObString cur_column_str;
|
||||
if (!is_expr_value) {
|
||||
cur_column_str = escape_quotation(value, data_buffer);
|
||||
remove_last_slash(cur_column_str);
|
||||
} else {
|
||||
cur_column_str = value;
|
||||
}
|
||||
if (i != 0) {
|
||||
if (OB_FAIL(insertsql.append(","))) {
|
||||
LOG_WARN("append failed", K(ret), K(insertsql.length()));
|
||||
}
|
||||
}
|
||||
if (OB_SUCC(ret)) {
|
||||
if (OB_FAIL(append_value(cur_column_str, insertsql, is_expr_value))) {
|
||||
LOG_WARN("append failed", K(ret), K(insertsql.length()), K(cur_column_str));
|
||||
}
|
||||
}
|
||||
}
|
||||
if (OB_SUCC(ret)) {
|
||||
if (OB_FAIL(insertsql.append(")"))) {
|
||||
LOG_WARN("append failed", K(ret), K(insertsql.length()));
|
||||
}
|
||||
}
|
||||
return ret;
|
||||
}
|
||||
|
||||
int ObLoadDataUtils::append_value(const ObString& cur_column_str, ObSqlString& sqlstr_values, bool is_expr_value)
|
||||
{
|
||||
int ret = OB_SUCCESS;
|
||||
if (!is_expr_value) {
|
||||
if (is_null_field(cur_column_str)) {
|
||||
if (OB_FAIL(sqlstr_values.append(NULL_STRING))) {
|
||||
LOG_WARN("append failed", K(ret));
|
||||
}
|
||||
} else {
|
||||
if (OB_FAIL(sqlstr_values.append_fmt("'%.*s'", cur_column_str.length(), cur_column_str.ptr()))) {
|
||||
LOG_WARN("append failed", K(ret));
|
||||
}
|
||||
}
|
||||
} else {
|
||||
if (OB_FAIL(sqlstr_values.append(cur_column_str))) {
|
||||
LOG_WARN("append failed", K(ret));
|
||||
}
|
||||
}
|
||||
return ret;
|
||||
}
|
||||
|
||||
int ObLoadDataUtils::append_values_in_local_process(const int64_t key_columns, const int64_t values_count,
|
||||
const ObIArray<ObString>& insert_values, const ObExprValueBitSet& expr_value_bitset, ObSqlString& insertsql,
|
||||
ObDataBuffer& data_buffer)
|
||||
{
|
||||
int ret = OB_SUCCESS;
|
||||
if (!insertsql.is_valid() || values_count > insert_values.count() || key_columns != values_count) {
|
||||
ret = OB_INVALID_ARGUMENT;
|
||||
LOG_WARN("insert values are invalid", K(ret), K(insertsql), K(values_count), K(insert_values.count()));
|
||||
} else {
|
||||
if (OB_FAIL(insertsql.append(" values "))) {
|
||||
LOG_WARN("append failed", K(ret), K(insertsql.length()));
|
||||
} else if (OB_FAIL(
|
||||
append_values_for_one_row(values_count, expr_value_bitset, insert_values, insertsql, data_buffer))) {
|
||||
LOG_WARN("append values for one row in local process failed", K(ret));
|
||||
}
|
||||
}
|
||||
return ret;
|
||||
}
|
||||
|
||||
ObString ObLoadDataUtils::escape_quotation(const ObString& value, ObDataBuffer& data_buf)
|
||||
{
|
||||
char* buf = data_buf.get_data();
|
||||
ObString result;
|
||||
|
||||
if (OB_ISNULL(buf)) {
|
||||
LOG_WARN("data buf is not inited");
|
||||
} else {
|
||||
// check if escape is needed
|
||||
bool need_escape = false;
|
||||
const char* src = value.ptr();
|
||||
int64_t str_len = value.length();
|
||||
ObLoadEscapeSM escape_sm;
|
||||
escape_sm.set_escape_char(ObLoadEscapeSM::ESCAPE_CHAR_MYSQL);
|
||||
for (int64_t i = 0; !need_escape && i < str_len; ++i) {
|
||||
if (*(src + i) == '\'' && !escape_sm.is_escaping()) {
|
||||
need_escape = true;
|
||||
}
|
||||
escape_sm.shift_by_input(*(src + i));
|
||||
}
|
||||
|
||||
if (!need_escape) {
|
||||
result = value;
|
||||
} else {
|
||||
int64_t pos = 0;
|
||||
escape_sm.reset();
|
||||
for (int64_t i = 0; i < str_len && pos < data_buf.get_capacity(); ++i) {
|
||||
if (*(src + i) == '\'' && !escape_sm.is_escaping()) {
|
||||
buf[pos++] = static_cast<char>(
|
||||
share::is_oracle_mode() ? ObLoadEscapeSM::ESCAPE_CHAR_ORACLE : ObLoadEscapeSM::ESCAPE_CHAR_MYSQL);
|
||||
}
|
||||
buf[pos++] = src[i];
|
||||
escape_sm.shift_by_input(*(src + i));
|
||||
}
|
||||
if (OB_UNLIKELY(pos >= data_buf.get_capacity())) {
|
||||
LOG_ERROR("data is too long"); // this should never happened, just for protection
|
||||
result.reset();
|
||||
} else {
|
||||
result.assign_ptr(buf, static_cast<int32_t>(pos));
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
return result;
|
||||
}
|
||||
|
||||
int ObLoadDataUtils::init_empty_string_array(ObIArray<ObString>& new_array, int64_t array_size)
|
||||
{
|
||||
int ret = OB_SUCCESS;
|
||||
new_array.reset();
|
||||
for (int64_t i = 0; OB_SUCC(ret) && i < array_size; ++i) {
|
||||
if (OB_FAIL(new_array.push_back(ObString::make_empty_string()))) {
|
||||
LOG_WARN("push back empty string failed", K(ret));
|
||||
}
|
||||
}
|
||||
return ret;
|
||||
}
|
||||
|
||||
bool ObKMPStateMachine::scan_buf(char*& cur_pos, const char* buf_end)
|
||||
{
|
||||
bool matched = false;
|
||||
if (OB_UNLIKELY(!is_inited_ || NULL == cur_pos)) {
|
||||
LOG_ERROR("ObKmpStateMachine not inited.", K(cur_pos), K(buf_end));
|
||||
} else {
|
||||
for (; !matched && cur_pos < buf_end; cur_pos++) {
|
||||
while (matched_pos_ > 0 && *cur_pos != str_[matched_pos_]) {
|
||||
matched_pos_ = next_[matched_pos_];
|
||||
}
|
||||
if (*cur_pos == str_[matched_pos_]) {
|
||||
matched_pos_++;
|
||||
}
|
||||
if (matched_pos_ == str_len_) {
|
||||
matched_pos_ = 0;
|
||||
matched = true;
|
||||
}
|
||||
}
|
||||
}
|
||||
return matched;
|
||||
}
|
||||
|
||||
int ObKMPStateMachine::init(ObIAllocator& allocator, const ObString& str)
|
||||
{
|
||||
int ret = OB_SUCCESS;
|
||||
void* next_buff = NULL;
|
||||
void* str_buff = NULL;
|
||||
int32_t str_len = str.length();
|
||||
if (OB_UNLIKELY(is_inited_)) {
|
||||
ret = OB_INIT_TWICE;
|
||||
LOG_WARN("init failed, init twice.", K(ret));
|
||||
} else if (OB_UNLIKELY(str_len > KEY_WORD_MAX_LENGTH) || OB_UNLIKELY(str_len <= 0)) {
|
||||
ret = OB_INVALID_ARGUMENT;
|
||||
LOG_WARN("init failed, invalid argument.", K(ret));
|
||||
} else if (OB_ISNULL(next_buff = allocator.alloc(str_len * sizeof(int32_t)))) {
|
||||
ret = OB_ALLOCATE_MEMORY_FAILED;
|
||||
LOG_WARN("init failed, no memory.", K(ret), K(str_len));
|
||||
} else if (OB_ISNULL(str_buff = allocator.alloc(str_len * sizeof(char)))) {
|
||||
ret = OB_ALLOCATE_MEMORY_FAILED;
|
||||
LOG_WARN("init failed, no memory.", K(ret), K(str_len));
|
||||
} else {
|
||||
str_len_ = str_len;
|
||||
next_ = static_cast<int32_t*>(next_buff);
|
||||
str_ = static_cast<char*>(str_buff);
|
||||
// copy string
|
||||
MEMCPY(str_, str.ptr(), str.length());
|
||||
matched_pos_ = 0;
|
||||
// calc kmp next arr
|
||||
int32_t k = 0;
|
||||
next_[0] = 0;
|
||||
for (int64_t i = 1; i < str_len_; ++i) {
|
||||
while (k > 0 && str_[k] != str_[i]) {
|
||||
k = next_[k];
|
||||
}
|
||||
if (str_[k] == str_[i]) {
|
||||
k++;
|
||||
}
|
||||
next_[i] = k;
|
||||
}
|
||||
// check error
|
||||
for (int64_t i = 0; OB_SUCC(ret) && i < str_len_; ++i) {
|
||||
if (OB_UNLIKELY(next_[i] < 0) || OB_UNLIKELY(next_[i] >= str_len_)) {
|
||||
ret = OB_ERR_UNEXPECTED;
|
||||
LOG_WARN("check next value failed", K(ret));
|
||||
}
|
||||
}
|
||||
if (OB_SUCC(ret)) {
|
||||
is_inited_ = true;
|
||||
}
|
||||
}
|
||||
return ret;
|
||||
}
|
||||
|
||||
int ObLoadDataUtils::check_session_status(ObSQLSessionInfo& session, int64_t reserved_us)
|
||||
{
|
||||
int ret = OB_SUCCESS;
|
||||
bool is_timeout = false;
|
||||
int64_t query_timeout = 0;
|
||||
int64_t query_start_time = session.get_query_start_time();
|
||||
int64_t current_time = ObTimeUtil::current_time();
|
||||
|
||||
if (OB_FAIL(session.get_query_timeout(query_timeout))) {
|
||||
LOG_WARN("fail to get query timeout", K(ret));
|
||||
} else if (OB_FAIL(session.is_timeout(is_timeout))) {
|
||||
ret = OB_ERR_UNEXPECTED;
|
||||
LOG_WARN("get session timeout info failed", K(ret));
|
||||
} else if (OB_UNLIKELY(query_start_time + query_timeout < current_time + reserved_us)) {
|
||||
ret = OB_TIMEOUT;
|
||||
LOG_WARN("query is timeout", K(ret));
|
||||
} else if (OB_UNLIKELY(is_timeout)) {
|
||||
ret = OB_TIMEOUT;
|
||||
LOG_WARN("session is timeout", K(ret));
|
||||
} else if (OB_UNLIKELY(session.is_query_killed())) {
|
||||
ret = OB_ERR_QUERY_INTERRUPTED;
|
||||
LOG_WARN("query is killed", K(ret));
|
||||
} else if (OB_UNLIKELY(session.is_zombie())) {
|
||||
ret = OB_SESSION_KILLED;
|
||||
LOG_WARN("session is killed", K(ret));
|
||||
}
|
||||
if (OB_FAIL(ret)) {
|
||||
LOG_WARN(
|
||||
"LOAD DATA timeout", K(ret), K(session.get_sessid()), K(query_timeout), K(query_start_time), K(current_time));
|
||||
}
|
||||
return ret;
|
||||
}
|
||||
|
||||
int ObGlobalLoadDataStatMap::init()
|
||||
{
|
||||
int ret = OB_SUCCESS;
|
||||
if (IS_INIT) {
|
||||
ret = OB_INIT_TWICE;
|
||||
} else if (OB_FAIL(map_.create(bucket_num, ObModIds::OB_SQL_LOAD_DATA, ObModIds::OB_SQL_LOAD_DATA))) {
|
||||
ret = OB_ALLOCATE_MEMORY_FAILED;
|
||||
LOG_WARN("create hash table failed", K(ret));
|
||||
} else {
|
||||
is_inited_ = true;
|
||||
}
|
||||
return ret;
|
||||
}
|
||||
|
||||
int ObGlobalLoadDataStatMap::register_job(const ObLoadDataGID& id, ObLoadDataStat* job_status)
|
||||
{
|
||||
int ret = OB_SUCCESS;
|
||||
if (IS_NOT_INIT) {
|
||||
ret = OB_NOT_INIT;
|
||||
}
|
||||
OZ(map_.set_refactored(id, job_status));
|
||||
return ret;
|
||||
}
|
||||
|
||||
int ObGlobalLoadDataStatMap::unregister_job(const ObLoadDataGID& id, ObLoadDataStat*& job_status)
|
||||
{
|
||||
int ret = OB_SUCCESS;
|
||||
if (IS_NOT_INIT) {
|
||||
ret = OB_NOT_INIT;
|
||||
}
|
||||
OZ(map_.erase_refactored(id, &job_status));
|
||||
return ret;
|
||||
}
|
||||
|
||||
int ObGlobalLoadDataStatMap::get_job_status(const ObLoadDataGID& id, ObLoadDataStat*& job_status)
|
||||
{
|
||||
int ret = OB_SUCCESS;
|
||||
auto get_and_add_ref = [&](hash::HashMapPair<ObLoadDataGID, ObLoadDataStat*>& entry) -> void {
|
||||
entry.second->aquire();
|
||||
job_status = entry.second;
|
||||
};
|
||||
OZ(map_.read_atomic(id, get_and_add_ref));
|
||||
return ret;
|
||||
}
|
||||
|
||||
ObGlobalLoadDataStatMap* ObGlobalLoadDataStatMap::getInstance()
|
||||
{
|
||||
return instance_;
|
||||
}
|
||||
|
||||
ObGlobalLoadDataStatMap* ObGlobalLoadDataStatMap::instance_ = new ObGlobalLoadDataStatMap();
|
||||
|
||||
volatile int64_t ObLoadDataGID::GlobalLoadDataID = 0;
|
||||
|
||||
OB_SERIALIZE_MEMBER(ObLoadTaskStatus, task_status_);
|
||||
|
||||
OB_SERIALIZE_MEMBER(ObLoadDataGID, id);
|
||||
|
||||
} // namespace sql
|
||||
} // namespace oceanbase
|
||||
Reference in New Issue
Block a user