/** * Copyright (c) 2021 OceanBase * OceanBase CE is licensed under Mulan PubL v2. * You can use this software according to the terms and conditions of the Mulan PubL v2. * You may obtain a copy of Mulan PubL v2 at: * http://license.coscl.org.cn/MulanPubL-2.0 * THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, * EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, * MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. * See the Mulan PubL v2 for more details. */ #define USING_LOG_PREFIX SQL_ENG #include "sql/engine/expr/ob_expr_find_in_set.h" #include "lib/charset/ob_charset.h" using namespace oceanbase::common; namespace oceanbase { namespace sql { ObExprFindInSet::ObExprFindInSet(ObIAllocator &alloc) : ObFuncExprOperator(alloc, T_FUN_SYS_FIND_IN_SET, "find_in_set", 2, NOT_ROW_DIMENSION) { } ObExprFindInSet::~ObExprFindInSet() { } int ObExprFindInSet::calc_result_type2(ObExprResType &type, ObExprResType &type1, ObExprResType &type2, ObExprTypeCtx &type_ctx) const { int ret = OB_SUCCESS; type1.set_calc_type(ObVarcharType); type2.set_calc_type(ObVarcharType); if (OB_LIKELY(NOT_ROW_DIMENSION == row_dimension_)) { type.set_uint64(); type.set_precision(ObAccuracy::DDL_DEFAULT_ACCURACY[ObUInt64Type].precision_); type.set_scale(ObAccuracy::DDL_DEFAULT_ACCURACY[ObUInt64Type].scale_); type.set_calc_type(ObVarcharType); ObExprOperator::calc_result_flag2(type, type1, type2); ObObjMeta coll_types[2]; coll_types[0].set_collation(type1); coll_types[1].set_collation(type2); if (OB_FAIL(aggregate_charsets_for_comparison(type.get_calc_meta(), coll_types, 2, type_ctx.get_coll_type()))) { LOG_WARN("failed to aggregate_charsets_for_comparison", K(ret)); } else { type1.set_calc_collation_type(type.get_collation_type()); type1.set_calc_collation_level(type.get_collation_level()); type2.set_calc_collation_type(type.get_collation_type()); type2.set_calc_collation_level(type.get_collation_level()); } } else { ret = OB_ERR_INVALID_TYPE_FOR_OP; } return ret; } int search(const ObString &str, const ObString &str_list, const ObCollationType &cs_type, uint64_t &res_pos); int search(const ObString &str, const ObString &str_list, const ObCollationType &cs_type, uint64_t &res_pos) { int ret = OB_SUCCESS; const char* first_ptr = str.ptr(); int64_t first_length = str.length(); // if first input string contains ',', return 0 if (ObCharset::locate(cs_type, first_ptr, first_length, ",", 1, 1) != 0) { res_pos = 0; } else { bool is_found = false; res_pos = 1; uint32_t pre_separtor_pos = 0; uint32_t cur_separtor_pos = 0; uint32_t pre_sep_pos_byte = 0; uint32_t cur_sep_pos_byte = 0; const char *second_ptr = str_list.ptr(); int64_t second_length = str_list.length(); while ((!is_found) && (cur_separtor_pos = ObCharset::locate(cs_type, second_ptr, second_length, ",", 1, cur_separtor_pos + 1)) != 0) { cur_sep_pos_byte = ObCharset::charpos(cs_type, second_ptr, second_length, cur_separtor_pos); if (ObCharset::strcmp(cs_type, first_ptr, first_length, second_ptr + pre_sep_pos_byte, cur_sep_pos_byte - pre_sep_pos_byte - 1) == 0) { is_found = true; } else { pre_separtor_pos = cur_separtor_pos; pre_sep_pos_byte = cur_sep_pos_byte; ++res_pos; } LOG_DEBUG("find_in_set debug", K(ret), K(pre_sep_pos_byte), K(cur_separtor_pos), K(pre_sep_pos_byte), K(cur_separtor_pos), K(is_found), K(res_pos)); } if (!is_found) { // match the last substring extracted from strlist if (ObCharset::strcmp(cs_type, first_ptr, first_length, second_ptr + pre_sep_pos_byte, second_length - pre_sep_pos_byte) == 0) { // do nothing } else { res_pos = 0; } } } return ret; } int ObExprFindInSet::calc_find_in_set_expr(const ObExpr &expr, ObEvalCtx &ctx, ObDatum &res_datum) { int ret = OB_SUCCESS; // find_in_set(str, strlist) ObDatum *str = NULL; ObDatum *strlist = NULL; if (OB_UNLIKELY(2 != expr.arg_cnt_)) { ret = OB_ERR_UNEXPECTED; LOG_WARN("unexpected arg cnt", K(ret)); } else if (OB_FAIL(expr.eval_param_value(ctx, str, strlist))) { LOG_WARN("eval arg failed", K(ret)); } else if (str->is_null() || strlist->is_null()) { res_datum.set_null(); } else { const ObCollationType &cs_type = expr.args_[0]->datum_meta_.cs_type_; uint64_t res_pos = 0; if (OB_UNLIKELY(expr.args_[0]->datum_meta_.cs_type_ != expr.args_[1]->datum_meta_.cs_type_ || !ObCharset::is_valid_collation(static_cast(cs_type)))) { ret = OB_ERR_UNEXPECTED; LOG_WARN("invalid cs_type", K(ret), K(cs_type)); } else if (OB_FAIL(search(str->get_string(), strlist->get_string(), cs_type, res_pos))) { LOG_WARN("search str in str list failed", K(ret)); } else { res_datum.set_uint(res_pos); } } return ret; } int ObExprFindInSet::cg_expr(ObExprCGCtx &expr_cg_ctx, const ObRawExpr &raw_expr, ObExpr &rt_expr) const { int ret = OB_SUCCESS; UNUSED(expr_cg_ctx); UNUSED(raw_expr); rt_expr.eval_func_ = calc_find_in_set_expr; return ret; } } /* namespace sql */ } /* namespace oceanbase */