/** * Copyright (c) 2021 OceanBase * OceanBase CE is licensed under Mulan PubL v2. * You can use this software according to the terms and conditions of the Mulan PubL v2. * You may obtain a copy of Mulan PubL v2 at: * http://license.coscl.org.cn/MulanPubL-2.0 * THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, * EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, * MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. * See the Mulan PubL v2 for more details. */ #define USING_LOG_PREFIX SQL_ENG #include "lib/oblog/ob_log.h" #include "sql/engine/expr/ob_expr_initcap.h" #include "objit/common/ob_item_type.h" #include "common/data_buffer.h" #include "sql/session/ob_sql_session_info.h" namespace oceanbase { using namespace common; namespace sql { ObExprInitcap::ObExprInitcap(ObIAllocator &alloc) : ObStringExprOperator(alloc, T_FUN_SYS_INITCAP, N_INITCAP, 1) { } ObExprInitcap::~ObExprInitcap() { } int ObExprInitcap::calc_result_type1(ObExprResType &type, ObExprResType &text, ObExprTypeCtx &type_ctx) const { int ret = OB_SUCCESS; const ObBasicSessionInfo *session = type_ctx.get_session(); ObSEArray params; CK(OB_NOT_NULL(session)); OZ(params.push_back(&text)); OZ(aggregate_string_type_and_charset_oracle(*session, params, type, PREFER_VAR_LEN_CHAR)); OZ(deduce_string_param_calc_type_and_charset(*session, type, params)); if (OB_SUCC(ret)) { common::ObLength result_len = text.get_calc_length(); if (OB_UNLIKELY(!ObCharset::is_valid_collation(type.get_collation_type()))) { ret = OB_INVALID_ARGUMENT; LOG_WARN("invalid charset", K(type), K(ret)); } else { result_len *= ObCharset::get_charset(type.get_collation_type())->caseup_multiply; type.set_length(result_len); } } return ret; } int ObExprInitcap::initcap_string(const ObString &text, const ObCollationType cs_type, ObIAllocator *allocator, ObString &res_str) { int ret = OB_SUCCESS; if (OB_ISNULL(allocator)) { ret = OB_INVALID_ARGUMENT; LOG_WARN("allocator is null", K(ret)); } else { int64_t case_multiply = std::max(ObCharset::get_charset(cs_type)->caseup_multiply, ObCharset::get_charset(cs_type)->casedn_multiply); int64_t buf_len = case_multiply * text.length(); char *buf = static_cast(allocator->alloc(buf_len)); int64_t pos = 0; if (OB_ISNULL(buf)) { ret = OB_ALLOCATE_MEMORY_FAILED; LOG_WARN("alloc memory failed", K(text.length()), K(case_multiply), K(cs_type), K(ret)); } else { ObStringScanner scanner(text, cs_type); ObString cur_letter; int32_t wchar = 0; bool has_first_letter = false; if (1 == case_multiply) { MEMCPY(buf, text.ptr(), text.length()); } while (OB_SUCC(ret)) { if (OB_ITER_END == (ret = scanner.next_character(cur_letter, wchar))) { ret = OB_SUCCESS; break; } else if (OB_FAIL(ret)) { LOG_WARN("fail to get next character", K(ret), K(scanner)); } else { bool is_alphanumeric = (wchar <= INT8_MAX && ob_isalnum(ObCharset::get_charset(CS_TYPE_UTF8MB4_GENERAL_CI), wchar)); if (is_alphanumeric) { char *src_ptr = (1 == case_multiply) ? buf + pos : cur_letter.ptr(); int64_t buf_remain = cur_letter.length() * case_multiply; int64_t write_len = has_first_letter ? ObCharset::casedn(cs_type, src_ptr, cur_letter.length(), buf + pos, buf_remain) : ObCharset::caseup(cs_type, src_ptr, cur_letter.length(), buf + pos, buf_remain); if (OB_UNLIKELY(0 == write_len)) { ret = OB_ERR_UNEXPECTED; } else { pos += write_len; } has_first_letter = true; } else { has_first_letter = false; MEMCPY(buf + pos, cur_letter.ptr(), cur_letter.length()); pos += cur_letter.length(); } } } if (OB_SUCC(ret)) { res_str.assign_ptr(buf, pos); } } } return ret; } int calc_initcap_expr(const ObExpr &expr, ObEvalCtx &ctx, ObDatum &res_datum) { int ret = OB_SUCCESS; ObDatum *arg_datum = NULL; ObString res_str; char *res_buf = NULL; ObCollationType cs_type = expr.args_[0]->datum_meta_.cs_type_; int64_t case_multiply = std::max(ObCharset::get_charset(cs_type)->caseup_multiply, ObCharset::get_charset(cs_type)->casedn_multiply); if (OB_FAIL(expr.args_[0]->eval(ctx, arg_datum))) { LOG_WARN("eval arg 0 failed", K(ret), K(expr)); } else if (arg_datum->is_null()) { res_datum.set_null(); } else if (OB_ISNULL(res_buf = expr.get_str_res_mem(ctx, arg_datum->len_ * case_multiply))) { ret = OB_ALLOCATE_MEMORY_FAILED; LOG_WARN("allocate memory failed", K(ret)); } else { ObDataBuffer buf_alloc(res_buf, arg_datum->len_ * case_multiply); if (OB_FAIL(ObExprInitcap::initcap_string(arg_datum->get_string(), expr.args_[0]->datum_meta_.cs_type_, &buf_alloc, res_str))) { LOG_WARN("initcap string failed", K(ret), K(arg_datum->get_string())); } else if (0 == res_str.length()) { // initcap is only for oracle mode. set res be null when string length is 0. res_datum.set_null(); } else { res_datum.set_string(res_str); } } return ret; } int ObExprInitcap::cg_expr(ObExprCGCtx &expr_cg_ctx, const ObRawExpr &raw_expr, ObExpr &rt_expr) const { int ret = OB_SUCCESS; UNUSED(expr_cg_ctx); UNUSED(raw_expr); rt_expr.eval_func_ = calc_initcap_expr; return ret; } } /* sql */ } /* oceanbase */