init push

This commit is contained in:
oceanbase-admin
2021-05-31 22:56:52 +08:00
commit cea7de1475
7020 changed files with 5689869 additions and 0 deletions

View File

@ -0,0 +1,410 @@
/**
* Copyright (c) 2021 OceanBase
* OceanBase CE is licensed under Mulan PubL v2.
* You can use this software according to the terms and conditions of the Mulan PubL v2.
* You may obtain a copy of Mulan PubL v2 at:
* http://license.coscl.org.cn/MulanPubL-2.0
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
* See the Mulan PubL v2 for more details.
*/
#define USING_LOG_PREFIX SQL_ENG
#include "sql/engine/cmd/ob_load_data_utils.h"
#include "sql/resolver/cmd/ob_load_data_stmt.h"
#include "sql/session/ob_sql_session_info.h"
namespace oceanbase {
using namespace common;
namespace sql {
// SQL keyword appended (unquoted) by append_value() when a field is recognised by is_null_field().
const char* ObLoadDataUtils::NULL_STRING = "NULL";
// Single byte 0xFF.
// NOTE(review): presumably the in-band marker that is_null_field() looks for — confirm against the header.
const char ObLoadDataUtils::NULL_VALUE_FLAG = '\xff';
/**
 * Build the head of the generated DML statement: "<verb> into <table>(<col>,<col>,...)".
 *
 * @param insert_mode     duplicate-handling mode; selects "replace into", "insert ignore into" or "insert into"
 * @param table_name      appended verbatim right after the verb
 * @param insert_keys     column names; each one is wrapped in double quotes (oracle mode) or backticks
 * @param insertsql_keys  output buffer; it is reused (cleared) before anything is written
 * @return OB_SUCCESS, OB_NOT_SUPPORTED for an unknown insert_mode, or the error of the failing append
 */
int ObLoadDataUtils::build_insert_sql_string_head(ObLoadDupActionType insert_mode, const ObString& table_name,
    const ObIArray<ObString>& insert_keys, ObSqlString& insertsql_keys)
{
  int ret = OB_SUCCESS;
  const char* stmt_head = NULL;
  if (ObLoadDupActionType::LOAD_REPLACE == insert_mode) {
    stmt_head = "replace into ";
  } else if (ObLoadDupActionType::LOAD_IGNORE == insert_mode) {
    stmt_head = "insert ignore into ";
  } else if (ObLoadDupActionType::LOAD_STOP_ON_DUP == insert_mode) {
    stmt_head = "insert into ";
  } else {
    ret = OB_NOT_SUPPORTED;
    LOG_WARN("not suppport insert mode", K(insert_mode));
  }

  // The output buffer is cleared even when the mode is not supported.
  insertsql_keys.reuse();
  OZ(insertsql_keys.reserve(OB_MEDIUM_SQL_LENGTH));
  OZ(insertsql_keys.assign(stmt_head));
  OZ(insertsql_keys.append(table_name));
  OZ(insertsql_keys.append("("));

  // Every OZ() below is a no-op once ret holds an error, so the loop needs no extra guard.
  for (int64_t key_idx = 0; key_idx < insert_keys.count(); ++key_idx) {
    if (key_idx > 0) {
      OZ(insertsql_keys.append(","));
    }
    OZ(insertsql_keys.append_fmt(share::is_oracle_mode() ? "\"%.*s\"" : "`%.*s`",
        insert_keys.at(key_idx).length(),
        insert_keys.at(key_idx).ptr()));
  }
  OZ(insertsql_keys.append(")"));

  if (OB_FAIL(ret)) {
    LOG_WARN("append failed", K(ret), K(insertsql_keys.length()));
  }
  return ret;
}
/**
 * Append " values (..),(..),..." to insertsql for a batch of rows.
 *
 * insert_values is read as a flat, row-major array of table_column_count strings per row.
 * The first skipped_row_count rows are skipped and append_values_count / table_column_count
 * rows are emitted after them.
 *
 * @return OB_INVALID_ARGUMENT when insertsql is invalid, table_column_count is 0 or the requested
 *         range exceeds insert_values; otherwise OB_SUCCESS or the first append error
 */
int ObLoadDataUtils::append_values_in_remote_process(int64_t table_column_count, int64_t append_values_count,
    const ObExprValueBitSet& expr_bitset, const ObIArray<ObString>& insert_values, ObSqlString& insertsql,
    ObDataBuffer& data_buffer, int64_t skipped_row_count)
{
  int ret = OB_SUCCESS;
  if (OB_UNLIKELY(!insertsql.is_valid()) ||
      OB_UNLIKELY(0 == table_column_count) ||
      OB_UNLIKELY(append_values_count + skipped_row_count * table_column_count > insert_values.count())) {
    ret = OB_INVALID_ARGUMENT;
    LOG_WARN("insert values are invalid", K(ret), K(insertsql), K(append_values_count), K(insert_values.count()));
  } else if (OB_FAIL(insertsql.append(" values "))) {
    LOG_WARN("append failed", K(ret), K(insertsql.length()));
  } else {
    const int64_t row_count = append_values_count / table_column_count;
    const int64_t last_row_idx = row_count - 1;
    for (int64_t row_idx = 0; OB_SUCC(ret) && row_idx < row_count; ++row_idx) {
      if (OB_FAIL(append_values_for_one_row(
              table_column_count, expr_bitset, insert_values, insertsql, data_buffer, row_idx + skipped_row_count))) {
        LOG_WARN("append values for one row in remote process failed", K(ret));
      } else if (row_idx < last_row_idx && OB_FAIL(insertsql.append(","))) {
        // a separator goes between rows, but not after the last one
        LOG_WARN("append failed", K(ret), K(insertsql.length()));
      }
    }
  }
  return ret;
}
int ObLoadDataUtils::append_values_for_one_row(const int64_t table_column_count,
const ObExprValueBitSet& expr_value_bitset, const ObIArray<ObString>& insert_values, ObSqlString& insertsql,
ObDataBuffer& data_buffer, const int64_t skipped_row_count)
{
int ret = OB_SUCCESS;
int64_t value_offset = skipped_row_count * table_column_count;
if (OB_UNLIKELY(skipped_row_count * table_column_count + table_column_count > insert_values.count())) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid argument", K(skipped_row_count), K(table_column_count), K(insert_values.count()));
}
if (OB_SUCC(ret)) {
if (OB_FAIL(insertsql.append("("))) {
LOG_WARN("append failed", K(ret), K(insertsql.length()));
}
}
for (int64_t i = 0; OB_SUCC(ret) && i < table_column_count; ++i) {
const ObString& value = insert_values.at(i + value_offset);
bool is_expr_value = expr_value_bitset.has_member(i);
ObString cur_column_str;
if (!is_expr_value) {
cur_column_str = escape_quotation(value, data_buffer);
remove_last_slash(cur_column_str);
} else {
cur_column_str = value;
}
if (i != 0) {
if (OB_FAIL(insertsql.append(","))) {
LOG_WARN("append failed", K(ret), K(insertsql.length()));
}
}
if (OB_SUCC(ret)) {
if (OB_FAIL(append_value(cur_column_str, insertsql, is_expr_value))) {
LOG_WARN("append failed", K(ret), K(insertsql.length()), K(cur_column_str));
}
}
}
if (OB_SUCC(ret)) {
if (OB_FAIL(insertsql.append(")"))) {
LOG_WARN("append failed", K(ret), K(insertsql.length()));
}
}
return ret;
}
/**
 * Append a single column value to sqlstr_values.
 *
 *  - expression value: appended verbatim
 *  - field recognised by is_null_field(): the NULL_STRING keyword
 *  - anything else: the text wrapped in single quotes
 *
 * @return OB_SUCCESS or the error returned by the underlying append
 */
int ObLoadDataUtils::append_value(const ObString& cur_column_str, ObSqlString& sqlstr_values, bool is_expr_value)
{
  int ret = OB_SUCCESS;
  if (is_expr_value) {
    ret = sqlstr_values.append(cur_column_str);
  } else if (is_null_field(cur_column_str)) {
    ret = sqlstr_values.append(NULL_STRING);
  } else {
    ret = sqlstr_values.append_fmt("'%.*s'", cur_column_str.length(), cur_column_str.ptr());
  }
  if (OB_FAIL(ret)) {
    LOG_WARN("append failed", K(ret));
  }
  return ret;
}
/**
 * Append " values (v0,v1,...)" for exactly one row to insertsql.
 *
 * @return OB_INVALID_ARGUMENT when insertsql is invalid, values_count exceeds insert_values.count()
 *         or key_columns differs from values_count; otherwise OB_SUCCESS or the first append error
 */
int ObLoadDataUtils::append_values_in_local_process(const int64_t key_columns, const int64_t values_count,
    const ObIArray<ObString>& insert_values, const ObExprValueBitSet& expr_value_bitset, ObSqlString& insertsql,
    ObDataBuffer& data_buffer)
{
  int ret = OB_SUCCESS;
  const bool args_valid =
      insertsql.is_valid() && values_count <= insert_values.count() && key_columns == values_count;
  if (!args_valid) {
    ret = OB_INVALID_ARGUMENT;
    LOG_WARN("insert values are invalid", K(ret), K(insertsql), K(values_count), K(insert_values.count()));
  } else if (OB_FAIL(insertsql.append(" values "))) {
    LOG_WARN("append failed", K(ret), K(insertsql.length()));
  } else if (OB_FAIL(
                 append_values_for_one_row(values_count, expr_value_bitset, insert_values, insertsql, data_buffer))) {
    LOG_WARN("append values for one row in local process failed", K(ret));
  }
  return ret;
}
/**
 * Return `value` with every single quote that is not already escaped prefixed by an escape
 * character (ESCAPE_CHAR_ORACLE in oracle mode, ESCAPE_CHAR_MYSQL otherwise).
 *
 * When nothing has to be escaped the returned string aliases `value` and data_buf is not touched.
 * Otherwise the escaped copy is written into data_buf and the returned string points into it.
 *
 * @param value     input field
 * @param data_buf  scratch buffer that receives the escaped copy
 * @return the (possibly aliased) escaped string; an empty string if data_buf has no data pointer
 *         or is too small for the escaped copy
 */
ObString ObLoadDataUtils::escape_quotation(const ObString& value, ObDataBuffer& data_buf)
{
  char* buf = data_buf.get_data();
  ObString result;
  if (OB_ISNULL(buf)) {
    LOG_WARN("data buf is not inited");
  } else {
    // first pass: check if escape is needed
    bool need_escape = false;
    const char* src = value.ptr();
    const int64_t str_len = value.length();
    ObLoadEscapeSM escape_sm;
    escape_sm.set_escape_char(ObLoadEscapeSM::ESCAPE_CHAR_MYSQL);
    for (int64_t i = 0; !need_escape && i < str_len; ++i) {
      if (*(src + i) == '\'' && !escape_sm.is_escaping()) {
        need_escape = true;
      }
      escape_sm.shift_by_input(*(src + i));
    }
    if (!need_escape) {
      result = value;
    } else {
      // second pass: copy into data_buf, inserting the escape prefix before unescaped quotes
      const int64_t capacity = data_buf.get_capacity();
      const char quote_prefix = static_cast<char>(
          share::is_oracle_mode() ? ObLoadEscapeSM::ESCAPE_CHAR_ORACLE : ObLoadEscapeSM::ESCAPE_CHAR_MYSQL);
      int64_t pos = 0;
      bool overflow = false;
      // NOTE(review): the escape char is not set again after reset(); confirm reset() keeps it.
      escape_sm.reset();
      for (int64_t i = 0; !overflow && i < str_len; ++i) {
        const bool add_prefix = ('\'' == src[i] && !escape_sm.is_escaping());
        // An escaped quote needs two bytes. Check the room for both BEFORE writing, otherwise
        // the second store could land one byte past the end of the buffer.
        const int64_t bytes_needed = add_prefix ? 2 : 1;
        if (pos + bytes_needed > capacity) {
          overflow = true;
        } else {
          if (add_prefix) {
            buf[pos++] = quote_prefix;
          }
          buf[pos++] = src[i];
          escape_sm.shift_by_input(src[i]);
        }
      }
      // An exactly-full buffer is still treated as an error.
      if (OB_UNLIKELY(overflow) || OB_UNLIKELY(pos >= capacity)) {
        LOG_ERROR("data is too long");  // this should never happen, just for protection
        result.reset();
      } else {
        result.assign_ptr(buf, static_cast<int32_t>(pos));
      }
    }
  }
  return result;
}
/**
 * Reset new_array and fill it with array_size empty strings.
 *
 * @return OB_SUCCESS, or the error of the first push_back that fails (filling stops there)
 */
int ObLoadDataUtils::init_empty_string_array(ObIArray<ObString>& new_array, int64_t array_size)
{
  int ret = OB_SUCCESS;
  new_array.reset();
  int64_t filled = 0;
  while (OB_SUCC(ret) && filled < array_size) {
    if (OB_FAIL(new_array.push_back(ObString::make_empty_string()))) {
      LOG_WARN("push back empty string failed", K(ret));
    }
    ++filled;
  }
  return ret;
}
/**
 * Feed bytes from [cur_pos, buf_end) into the matcher until the pattern is found or the buffer
 * is exhausted.
 *
 * matched_pos_ (number of pattern bytes matched so far) is kept across calls, so a pattern may
 * span several buffers. After a full match matched_pos_ is reset to 0, i.e. overlapping
 * occurrences are not reported.
 *
 * @param cur_pos  in/out: start of the scan; on return points just past the last byte consumed
 * @param buf_end  one past the last readable byte
 * @return true if the pattern was completed inside this buffer, false otherwise (also when the
 *         machine is not initialised or cur_pos is NULL)
 */
bool ObKMPStateMachine::scan_buf(char*& cur_pos, const char* buf_end)
{
  bool matched = false;
  if (OB_UNLIKELY(!is_inited_ || NULL == cur_pos)) {
    LOG_ERROR("ObKmpStateMachine not inited.", K(cur_pos), K(buf_end));
  } else {
    for (; !matched && cur_pos < buf_end; cur_pos++) {
      // On a mismatch fall back to the longest border of the part that DID match, which is
      // str_[0 .. matched_pos_-1]; its length is next_[matched_pos_ - 1]. Using
      // next_[matched_pos_] may never decrease matched_pos_ (e.g. pattern "aa", input "ab").
      while (matched_pos_ > 0 && *cur_pos != str_[matched_pos_]) {
        matched_pos_ = next_[matched_pos_ - 1];
      }
      if (*cur_pos == str_[matched_pos_]) {
        matched_pos_++;
      }
      if (matched_pos_ == str_len_) {
        matched_pos_ = 0;
        matched = true;
      }
    }
  }
  return matched;
}
/**
 * Initialise the matcher for pattern `str`.
 *
 * Copies the pattern into memory obtained from `allocator` and builds the failure table, where
 * next_[i] is the length of the longest proper prefix of str_[0..i] that is also a suffix of it.
 *
 * @return OB_INIT_TWICE if already initialised, OB_INVALID_ARGUMENT for an empty pattern or one
 *         longer than KEY_WORD_MAX_LENGTH, OB_ALLOCATE_MEMORY_FAILED if an allocation fails,
 *         OB_ERR_UNEXPECTED if the table fails its sanity check, OB_SUCCESS otherwise
 */
int ObKMPStateMachine::init(ObIAllocator& allocator, const ObString& str)
{
  int ret = OB_SUCCESS;
  void* next_buff = NULL;
  void* str_buff = NULL;
  int32_t str_len = str.length();
  if (OB_UNLIKELY(is_inited_)) {
    ret = OB_INIT_TWICE;
    LOG_WARN("init failed, init twice.", K(ret));
  } else if (OB_UNLIKELY(str_len > KEY_WORD_MAX_LENGTH) || OB_UNLIKELY(str_len <= 0)) {
    ret = OB_INVALID_ARGUMENT;
    LOG_WARN("init failed, invalid argument.", K(ret));
  } else if (OB_ISNULL(next_buff = allocator.alloc(str_len * sizeof(int32_t)))) {
    ret = OB_ALLOCATE_MEMORY_FAILED;
    LOG_WARN("init failed, no memory.", K(ret), K(str_len));
  } else if (OB_ISNULL(str_buff = allocator.alloc(str_len * sizeof(char)))) {
    ret = OB_ALLOCATE_MEMORY_FAILED;
    LOG_WARN("init failed, no memory.", K(ret), K(str_len));
  } else {
    str_len_ = str_len;
    next_ = static_cast<int32_t*>(next_buff);
    str_ = static_cast<char*>(str_buff);
    // copy string
    MEMCPY(str_, str.ptr(), str.length());
    matched_pos_ = 0;
    // calc kmp next arr (prefix function)
    int32_t k = 0;
    next_[0] = 0;
    for (int64_t i = 1; i < str_len_; ++i) {
      // k is the border length carried over from position i-1. On a mismatch shrink it to the
      // next shorter border, which is next_[k - 1]. next_[k] would be wrong and, for patterns
      // such as "aab", would never decrease k.
      while (k > 0 && str_[k] != str_[i]) {
        k = next_[k - 1];
      }
      if (str_[k] == str_[i]) {
        k++;
      }
      next_[i] = k;
    }
    // check error: every entry must be a valid border length
    for (int64_t i = 0; OB_SUCC(ret) && i < str_len_; ++i) {
      if (OB_UNLIKELY(next_[i] < 0) || OB_UNLIKELY(next_[i] >= str_len_)) {
        ret = OB_ERR_UNEXPECTED;
        LOG_WARN("check next value failed", K(ret));
      }
    }
    if (OB_SUCC(ret)) {
      is_inited_ = true;
    }
  }
  return ret;
}
/**
 * Check whether the running query may continue.
 *
 * @param session      session executing the statement
 * @param reserved_us  safety margin: the query counts as timed out when fewer than reserved_us
 *                     remain before query_start_time + query_timeout
 * @return OB_SUCCESS when the query may go on; OB_TIMEOUT (query or session timed out),
 *         OB_ERR_QUERY_INTERRUPTED (query killed), OB_SESSION_KILLED (zombie session),
 *         OB_ERR_UNEXPECTED (session timeout state unavailable) or the error of get_query_timeout()
 */
int ObLoadDataUtils::check_session_status(ObSQLSessionInfo& session, int64_t reserved_us)
{
  int ret = OB_SUCCESS;
  const int64_t query_start_time = session.get_query_start_time();
  const int64_t current_time = ObTimeUtil::current_time();
  int64_t query_timeout = 0;
  bool is_timeout = false;

  if (OB_FAIL(session.get_query_timeout(query_timeout))) {
    LOG_WARN("fail to get query timeout", K(ret));
  } else if (OB_FAIL(session.is_timeout(is_timeout))) {
    ret = OB_ERR_UNEXPECTED;
    LOG_WARN("get session timeout info failed", K(ret));
  } else {
    const bool query_expired = (query_start_time + query_timeout < current_time + reserved_us);
    if (OB_UNLIKELY(query_expired)) {
      ret = OB_TIMEOUT;
      LOG_WARN("query is timeout", K(ret));
    } else if (OB_UNLIKELY(is_timeout)) {
      ret = OB_TIMEOUT;
      LOG_WARN("session is timeout", K(ret));
    } else if (OB_UNLIKELY(session.is_query_killed())) {
      ret = OB_ERR_QUERY_INTERRUPTED;
      LOG_WARN("query is killed", K(ret));
    } else if (OB_UNLIKELY(session.is_zombie())) {
      ret = OB_SESSION_KILLED;
      LOG_WARN("session is killed", K(ret));
    }
  }

  // One summary line for every failure, whatever its cause.
  if (OB_FAIL(ret)) {
    LOG_WARN(
        "LOAD DATA timeout", K(ret), K(session.get_sessid()), K(query_timeout), K(query_start_time), K(current_time));
  }
  return ret;
}
/**
 * Create the underlying hash map.
 *
 * @return OB_INIT_TWICE if already initialised; OB_ALLOCATE_MEMORY_FAILED if the map cannot be
 *         created (whatever error create() reported); OB_SUCCESS otherwise
 */
int ObGlobalLoadDataStatMap::init()
{
  int ret = OB_SUCCESS;
  if (IS_INIT) {
    ret = OB_INIT_TWICE;
  } else {
    const int create_ret = map_.create(bucket_num, ObModIds::OB_SQL_LOAD_DATA, ObModIds::OB_SQL_LOAD_DATA);
    if (OB_SUCCESS != create_ret) {
      // any creation failure is reported as an allocation failure
      ret = OB_ALLOCATE_MEMORY_FAILED;
      LOG_WARN("create hash table failed", K(ret));
    } else {
      is_inited_ = true;
    }
  }
  return ret;
}
int ObGlobalLoadDataStatMap::register_job(const ObLoadDataGID& id, ObLoadDataStat* job_status)
{
int ret = OB_SUCCESS;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
}
OZ(map_.set_refactored(id, job_status));
return ret;
}
int ObGlobalLoadDataStatMap::unregister_job(const ObLoadDataGID& id, ObLoadDataStat*& job_status)
{
int ret = OB_SUCCESS;
if (IS_NOT_INIT) {
ret = OB_NOT_INIT;
}
OZ(map_.erase_refactored(id, &job_status));
return ret;
}
int ObGlobalLoadDataStatMap::get_job_status(const ObLoadDataGID& id, ObLoadDataStat*& job_status)
{
int ret = OB_SUCCESS;
auto get_and_add_ref = [&](hash::HashMapPair<ObLoadDataGID, ObLoadDataStat*>& entry) -> void {
entry.second->aquire();
job_status = entry.second;
};
OZ(map_.read_atomic(id, get_and_add_ref));
return ret;
}
/**
 * Accessor for the process-wide map object held in the static member instance_.
 *
 * @return the value of instance_; the function performs no init() check itself
 */
ObGlobalLoadDataStatMap* ObGlobalLoadDataStatMap::getInstance()
{
  ObGlobalLoadDataStatMap* const global_map = instance_;
  return global_map;
}
// The object returned by getInstance(). It is heap-allocated during static initialisation;
// no matching delete is visible in this file.
ObGlobalLoadDataStatMap* ObGlobalLoadDataStatMap::instance_ = new ObGlobalLoadDataStatMap();
// Global counter, starts at 0.
// NOTE(review): presumably the source of new ObLoadDataGID values; `volatile` alone gives no
// atomicity, so confirm that every update goes through an atomic primitive.
volatile int64_t ObLoadDataGID::GlobalLoadDataID = 0;
// Serialization definitions: ObLoadTaskStatus serializes task_status_, ObLoadDataGID serializes id.
OB_SERIALIZE_MEMBER(ObLoadTaskStatus, task_status_);
OB_SERIALIZE_MEMBER(ObLoadDataGID, id);
} // namespace sql
} // namespace oceanbase