Files
oceanbase/src/sql/engine/expr/ob_expr_column_conv.cpp
wanghangQ 5cbd86c9e6 [FEAT MERGE] Vector Index & Array Type
Co-authored-by: helloamateur <magiccheery@163.com>
Co-authored-by: skylhd <dickylhd@gmail.com>
Co-authored-by: JLY2015 <1623359870@qq.com>
2024-08-29 07:52:22 +00:00

780 lines
34 KiB
C++

/**
* Copyright (c) 2021 OceanBase
* OceanBase CE is licensed under Mulan PubL v2.
* You can use this software according to the terms and conditions of the Mulan PubL v2.
* You may obtain a copy of Mulan PubL v2 at:
* http://license.coscl.org.cn/MulanPubL-2.0
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
* See the Mulan PubL v2 for more details.
*/
#define USING_LOG_PREFIX SQL_ENG
#include "lib/utility/ob_macro_utils.h"
#include "sql/engine/expr/ob_expr_column_conv.h"
#include "sql/engine/expr/ob_datum_cast.h"
#include "sql/session/ob_sql_session_info.h"
#include "common/sql_mode/ob_sql_mode_utils.h"
#include "sql/engine/expr/ob_expr_type_to_str.h"
#include "sql/engine/ob_exec_context.h"
#include "sql/engine/expr/ob_expr_lob_utils.h"
#include "lib/geo/ob_geo_utils.h"
#include "sql/resolver/expr/ob_raw_expr_util.h"
using namespace oceanbase::common;
namespace oceanbase
{
namespace sql
{
ObFastColumnConvExpr::ObFastColumnConvExpr(ObIAllocator &alloc)
: ObBaseExprColumnConv(alloc),
ObFastExprOperator(T_FUN_COLUMN_CONV),
column_type_(alloc),
value_item_(),
column_info_()
{
}
int ObFastColumnConvExpr::assign(const ObFastExprOperator &other)
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(other.get_op_type() != T_FUN_COLUMN_CONV)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid argument", K(other.get_op_type()));
} else {
const ObFastColumnConvExpr &other_conv = static_cast<const ObFastColumnConvExpr&>(other);
column_type_ = other_conv.column_type_;
value_item_ = other_conv.value_item_;
if (OB_FAIL(ob_write_string(alloc_, other_conv.column_info_, column_info_))) {
LOG_WARN("fail to set column info", K(ret));
}
}
return ret;
}
int ObFastColumnConvExpr::calc(ObExprCtx &expr_ctx, const ObNewRow &row, ObObj &result) const
{
int ret = OB_SUCCESS;
if (OB_UNLIKELY(OB_ISNULL(expr_ctx.my_session_))) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("expr context is invalid", K(ret), K(expr_ctx.my_session_), K(expr_ctx.phy_plan_ctx_));
} else {
bool is_strict = is_strict_mode(expr_ctx.my_session_->get_sql_mode());
const ObObj *value = NULL;
const ObString *column_info = NULL;
if (has_column_info()) {
column_info = &column_info_;
}
if (OB_FAIL(value_item_.get_item_value_directly(*expr_ctx.phy_plan_ctx_, row, value))) {
LOG_WARN("get item value directly from value item failed", K(ret), K_(value_item));
} else if (OB_FAIL(ObSqlExpressionUtil::expand_array_params(expr_ctx, *value, value))) {
LOG_WARN("expand array params failed", K(ret));
} else if (OB_FAIL(ObExprColumnConv::convert_skip_null_check(result, *value, column_type_,
is_strict, expr_ctx.column_conv_ctx_,
&str_values_, column_info))) {
LOG_WARN("convert column value failed", K(ret), K(*this));
}
}
return ret;
}
int ObFastColumnConvExpr::set_const_value(const ObObj &value)
{
int ret = OB_SUCCESS;
ObObj tmp;
if (OB_FAIL(ob_write_obj(alloc_, value, tmp))) {
LOG_WARN("write const value failed", K(ret));
} else if (OB_FAIL(value_item_.assign(tmp))) {
LOG_WARN("write value item failed", K(ret));
}
return ret;
}
//由于在14x的版本中ObExprColumnConv使用的是父类ObExprOperator的序列化函数
//为了保证兼容性,这里先序列化父类ObExprOperator的成员,再序列化自身的成员
OB_SERIALIZE_MEMBER(ObExprColumnConv, row_dimension_, real_param_num_, result_type_, input_types_, id_, str_values_);
ObExprColumnConv::ObExprColumnConv(ObIAllocator &alloc)
: ObBaseExprColumnConv(alloc),
ObFuncExprOperator(alloc, T_FUN_COLUMN_CONV, N_COLUMN_CONV, -1, NOT_VALID_FOR_GENERATED_COL, NOT_ROW_DIMENSION,
INTERNAL_IN_MYSQL_MODE, INTERNAL_IN_ORACLE_MODE)
{
disable_operand_auto_cast();
//obexprcolumnconv有自己特殊处理,不走字符集自动转换框架
need_charset_convert_ = false;
}
ObExprColumnConv::~ObExprColumnConv()
{
}
int ObExprColumnConv::assign(const ObExprOperator &other)
{
int ret = OB_SUCCESS;
const ObExprColumnConv *tmp_other = dynamic_cast<const ObExprColumnConv *>(&other);
if (OB_UNLIKELY(NULL == tmp_other)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid argument. wrong type for other", K(ret), K(other));
} else if (OB_LIKELY(this != tmp_other)) {
if (OB_FAIL(ObFuncExprOperator::assign(other))) {
LOG_WARN("copy in Base class ObFuncExprOperator failed", K(ret));
} else if (tmp_other->str_values_.count() > 0 &&
OB_FAIL(deep_copy_str_values(tmp_other->str_values_))) {
LOG_WARN("copy str_values failed", K(ret));
}
}
return ret;
}
int ObExprColumnConv::convert_with_null_check(ObObj &result,
const ObObj &obj,
const ObExprResType &res_type,
bool is_strict,
ObCastCtx &cast_ctx,
const ObIArray<ObString> *type_infos)
{
int ret = OB_SUCCESS;
bool is_not_null = res_type.is_not_null_for_write();
if (OB_FAIL(ObExprColumnConv::convert_skip_null_check(result, obj, res_type, is_strict,
cast_ctx, type_infos))) {
LOG_WARN("fail to convert skip null check", K(ret));
} else if (is_not_null && (result.is_null() || (lib::is_oracle_mode() && result.is_null_oracle()))) {
ret = OB_BAD_NULL_ERROR;
LOG_WARN("Column should not be null", K(ret));
}
return ret;
}
int ObExprColumnConv::convert_skip_null_check(ObObj &result,
const ObObj &obj,
const ObExprResType &res_type,
bool is_strict,
ObCastCtx &cast_ctx,
const ObIArray<ObString> *type_infos,
const ObString *column_info)
{
int ret = OB_SUCCESS;
ObObjType type = res_type.get_type();
const ObAccuracy &accuracy = res_type.get_accuracy();
ObCollationType collation_type = res_type.get_collation_type();
const ObObj *res_obj = NULL;
cast_ctx.expect_obj_collation_ = collation_type;
cast_ctx.dest_collation_ = collation_type;
ObAccuracy tmp_accuracy = accuracy;
cast_ctx.res_accuracy_ = &tmp_accuracy;
if (OB_UNLIKELY(ob_is_enum_or_set_type(type))) {
ObExpectType expect_type;
expect_type.set_type(type);
expect_type.set_collation_type(collation_type);
expect_type.set_type_infos(type_infos);
if (OB_FAIL(ObObjCaster::to_type(expect_type, cast_ctx, obj, result))) {
LOG_WARN("fail to cast to enum or set", K(obj), K(expect_type), K(ret));
} else {
res_obj = &result;
}
} else if (OB_FAIL(ObObjCaster::to_type(type, cast_ctx, obj, result, res_obj)) || OB_ISNULL(res_obj)) {
ret = COVER_SUCC(OB_ERR_UNEXPECTED);
LOG_WARN("failed to cast object", K(ret), K(obj), "type", type);
} else {
LOG_DEBUG("succ to to_type", K(type), K(obj), K(result), K(collation_type));
}
if (OB_SUCC(ret)) {
const int64_t max_accuracy_len = static_cast<int64_t>(res_type.
get_accuracy().get_length());
const int64_t str_len_byte = static_cast<int64_t>(result.get_string_len());
if (OB_FAIL(obj_collation_check(is_strict, collation_type, *const_cast<ObObj*>(res_obj)))) {
LOG_WARN("failed to check collation", K(ret), K(collation_type), KPC(res_obj));
} else if (OB_FAIL(obj_accuracy_check(cast_ctx, accuracy, collation_type, *res_obj, result, res_obj))) {
LOG_WARN("failed to check accuracy", K(ret), K(accuracy), K(collation_type), KPC(res_obj));
if (OB_ERR_DATA_TOO_LONG == ret && lib::is_oracle_mode()
&& OB_NOT_NULL(column_info) && !column_info->empty()) {
int64_t col_length = str_len_byte;
if (ObStringTC == ob_obj_type_class(type)
&& !is_oracle_byte_length(lib::is_oracle_mode(), accuracy.get_length_semantics())) {
col_length = ObCharset::strlen_char(collation_type, result.get_string().ptr(), str_len_byte);
}
LOG_ORACLE_USER_ERROR(OB_ERR_DATA_TOO_LONG_MSG_FMT_V2, column_info->length(),
column_info->ptr(), col_length, max_accuracy_len);
}
}
}
if (OB_SUCC(ret)) {
if (res_obj != &result) {
//res_obj没有指向result的地址,需要将res_obj的值拷贝到result中
result = *res_obj;
}
// if (is_not_null && (result.is_null() || (is_oracle_mode() && result.is_null_oracle()))) {
// ret = OB_BAD_NULL_ERROR;
// LOG_WARN("Column should not be null", K(ret));
// }
}
return ret;
}
int ObExprColumnConv::calc_result_typeN(ObExprResType &type,
ObExprResType *types,
int64_t param_num,
common::ObExprTypeCtx &type_ctx) const
{
int ret = common::OB_SUCCESS;
//objs[0] type
//objs[1] collation_type
//objs[2] accuray_expr
//objs[3] nullable_expr
//objs[4] value
//objs[5] column_info
ObCollationType coll_type = CS_TYPE_INVALID;
if (OB_ISNULL(type_ctx.get_session()) || OB_ISNULL(type_ctx.get_raw_expr())) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("session is NULL or raw expr is NULL", K(ret));
} else if (OB_UNLIKELY(((PARAMS_COUNT_WITHOUT_COLUMN_INFO != param_num)
&& (PARAMS_COUNT_WITH_COLUMN_INFO != param_num))
|| OB_ISNULL(types))) {
ret = OB_INVALID_ARGUMENT;
SQL_ENG_LOG(WARN, "invalid argument, param_num should be 5 or 6",
K(param_num), K(types), K(ret));
} else if (OB_FAIL(type_ctx.get_session()->get_collation_connection(coll_type))) {
SQL_ENG_LOG(WARN, "fail to get_collation_connection", K(coll_type), K(ret));
} else {
type.set_type(types[0].get_type());
type.set_collation_type(types[1].get_collation_type());
// set collation level
ObCollationLevel coll_level = ObRawExprUtils::get_column_collation_level(types[0].get_type());
type.set_collation_level(coll_level);
type.set_accuracy(types[2].get_accuracy());
if (type.get_type() == ObUserDefinedSQLType
|| type.get_type() == ObCollectionSQLType) {
uint64_t udt_id = types[2].get_accuracy().get_accuracy();
uint16_t subschema_id = ObMaxSystemUDTSqlType;
// need const cast to modify subschema ctx, in physcial plan ctx belong to cur exec_ctx;
ObSQLSessionInfo *session = const_cast<ObSQLSessionInfo *>(type_ctx.get_session());
ObExecContext *exec_ctx = OB_ISNULL(session) ? NULL : session->get_cur_exec_ctx();
if (udt_id == T_OBJ_XML) {
subschema_id = ObXMLSqlType;
} else if (OB_ISNULL(exec_ctx)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("need context to search subschema mapping", K(ret), K(udt_id));
} else if (str_values_.count() > 0) {
// array type
if (OB_FAIL(exec_ctx->get_subschema_id_by_type_string(str_values_.at(0), subschema_id))) {
LOG_WARN("failed to get array type subschema id", K(ret));
}
} else if (OB_FAIL(exec_ctx->get_subschema_id_by_udt_id(udt_id, subschema_id))) {
LOG_WARN("failed to get sub schema id", K(ret), K(udt_id));
}
if (OB_SUCC(ret)) {
type.set_subschema_id(subschema_id);
}
}
if (types[3].is_not_null_for_read()) {
type.set_result_flag(NOT_NULL_FLAG | NOT_NULL_WRITE_FLAG);
}
bool enumset_to_varchar = false;
//here will wrap type_to_str if necessary
if (OB_SUCC(ret) && ob_is_enumset_tc(types[4].get_type())) {
ObObjType calc_type = enumset_calc_types_[OBJ_TYPE_TO_CLASS[types[0].get_type()]];
if (OB_UNLIKELY(ObMaxType == calc_type)) {
ret = OB_ERR_UNEXPECTED;
SQL_ENG_LOG(WARN, "invalid type of parameter ", K(types[4]), K(types), K(ret));
} else if (ObVarcharType == calc_type) {
enumset_to_varchar = true;
types[4].set_calc_type(calc_type);
types[4].set_calc_collation_type(coll_type);
types[4].set_calc_collation_level(CS_LEVEL_IMPLICIT);
type_ctx.set_cast_mode(type_ctx.get_cast_mode() | type_ctx.get_raw_expr()->get_extra());
}
}
// for table modify in oracle mode, we ignore charset convert failed
if (OB_SUCC(ret) && lib::is_oracle_mode()) {
type_ctx.set_cast_mode(type_ctx.get_cast_mode() | CM_CHARSET_CONVERT_IGNORE_ERR);
}
if (OB_SUCC(ret) &&
OB_FAIL(ObCharset::check_valid_implicit_convert(types[4].get_collation_type(),
types[1].get_collation_type()))) {
LOG_WARN("failed to check valid implicit convert", K(ret));
}
if (OB_SUCC(ret) && !enumset_to_varchar) {
//cast type when type not same.
const ObObjTypeClass value_tc = ob_obj_type_class(types[4].get_type());
const ObObjTypeClass type_tc = ob_obj_type_class(types[0].get_type());
ObSQLSessionInfo *session = const_cast<ObSQLSessionInfo *>(type_ctx.get_session());
bool is_prepare_stage = session->is_pl_prepare_stage();
if (lib::is_oracle_mode()
&& OB_UNLIKELY(!cast_supported(types[4].get_type(), types[4].get_collation_type(),
types[0].get_type(), types[1].get_collation_type()))
&& !(is_prepare_stage && type_tc == ObGeometryTC)) {
ret = OB_ERR_INVALID_TYPE_FOR_OP;
LOG_WARN("inconsistent datatypes", "expected", type_tc, "got", value_tc);
} else {
type_ctx.set_cast_mode(type_ctx.get_cast_mode() |
type_ctx.get_raw_expr()->get_extra() |
CM_COLUMN_CONVERT);
types[4].set_calc_meta(type);
if (ob_is_number_or_decimal_int_tc(type.get_type())) {
// decimal/number int need to setup calc accuracy
types[4].set_calc_accuracy(type.get_accuracy());
type.set_collation_level(common::CS_LEVEL_NUMERIC);
} else if (ob_is_user_defined_type(type.get_type())
|| ob_is_collection_sql_type(type.get_type())) { // if calc meta is udt, set calc udt id
types[4].set_calc_accuracy(type.get_accuracy());
}
}
}
LOG_DEBUG("finish calc_result_typeN", K(type), K(types[4]), K(types[0]), K(enumset_to_varchar));
}
return ret;
}
int ObExprColumnConv::cg_expr(ObExprCGCtx &op_cg_ctx,
const ObRawExpr &raw_expr,
ObExpr &rt_expr) const
{
int ret = OB_SUCCESS;
UNUSED(raw_expr);
//compatible with old code
CK((PARAMS_COUNT_WITHOUT_COLUMN_INFO == rt_expr.arg_cnt_)
|| (PARAMS_COUNT_WITH_COLUMN_INFO == rt_expr.arg_cnt_));
if (OB_ISNULL(op_cg_ctx.session_)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("exec ctx is null", K(ret));
} else if (OB_FAIL(ObEnumSetInfo::init_enum_set_info(op_cg_ctx.allocator_, rt_expr, type_,
raw_expr.get_extra(), str_values_))) {
LOG_WARN("fail to init_enum_set_info", K(ret), K(type_), K(str_values_));
} else {
ObEnumSetInfo *enumset_info = static_cast<ObEnumSetInfo *>(rt_expr.extra_info_);
if (op_cg_ctx.session_->is_ignore_stmt()) {
enumset_info->cast_mode_ = enumset_info->cast_mode_ | CM_WARN_ON_FAIL
| CM_CHARSET_CONVERT_IGNORE_ERR;
}
enumset_info->cast_mode_ |= CM_COLUMN_CONVERT;
if (GET_MIN_CLUSTER_VERSION() >= CLUSTER_VERSION_4_3_3_0
&& (enumset_info->cast_mode_ & CM_FAST_COLUMN_CONV)
&& !ob_is_enum_or_set_type(rt_expr.datum_meta_.type_)) {
rt_expr.eval_func_ = column_convert_fast;
if (rt_expr.args_[4]->is_batch_result()) {
rt_expr.eval_batch_func_ = column_convert_batch_fast;
}
} else {
rt_expr.eval_func_ = column_convert;
if (rt_expr.args_[4]->is_batch_result()
&& !ob_is_enum_or_set_type(rt_expr.datum_meta_.type_)
&& !is_lob_storage(rt_expr.datum_meta_.type_)
&& GET_MIN_CLUSTER_VERSION() >= CLUSTER_VERSION_4_3_3_0) {
rt_expr.eval_batch_func_ = column_convert_batch;
}
}
}
return ret;
}
static OB_INLINE int column_convert_datum_accuracy_check(const ObExpr &expr,
ObEvalCtx &ctx,
bool has_lob_header,
ObDatum &datum,
const uint64_t &cast_mode,
ObDatum &datum_for_check)
{
int ret = OB_SUCCESS;
int warning = OB_SUCCESS;
const int64_t max_accuracy_len = static_cast<int64_t>(expr.max_length_);
const int64_t str_len_byte = static_cast<int64_t>(datum_for_check.len_);
if (OB_FAIL(datum_accuracy_check(expr,
cast_mode,
ctx,
has_lob_header,
datum_for_check,
datum,
warning))) {
LOG_WARN("fail to check accuracy", K(ret), K(expr), K(warning));
//compatible with old code
if (OB_ERR_DATA_TOO_LONG == ret && lib::is_oracle_mode()
&& ObExprColumnConv::PARAMS_COUNT_WITH_COLUMN_INFO == expr.arg_cnt_) {
ObString column_info_str;
ObDatum *column_info = NULL;
if (OB_FAIL(expr.args_[5]->eval(ctx, column_info))) {
LOG_WARN("evaluate parameter failed", K(ret));
} else {
column_info_str = column_info->get_string();
int64_t col_length = str_len_byte;
if (ObStringTC == ob_obj_type_class(expr.datum_meta_.get_type())
&& !is_oracle_byte_length(lib::is_oracle_mode(), expr.datum_meta_.length_semantics_)) {
col_length = ObCharset::strlen_char(expr.datum_meta_.cs_type_, datum_for_check.ptr_, str_len_byte);
}
LOG_ORACLE_USER_ERROR(OB_ERR_DATA_TOO_LONG_MSG_FMT_V2, column_info_str.length(),
column_info_str.ptr(), col_length, max_accuracy_len);
}
ret = OB_ERR_DATA_TOO_LONG;
}
}
if (OB_SUCC(ret) && lib::is_mysql_mode() && OB_ERR_DATA_TOO_LONG == warning) {
ObDatum *column_info = NULL;
int64_t rownum = ctx.exec_ctx_.get_cur_rownum();
if (rownum > 0
&& ObExprColumnConv::PARAMS_COUNT_WITH_COLUMN_INFO == expr.arg_cnt_
&& OB_SUCCESS == expr.args_[5]->eval(ctx, column_info)) {
LOG_USER_WARN(OB_ERR_DATA_TRUNCATED, column_info->get_string().length(),
column_info->get_string().ptr(), rownum);
}
}
return ret;
}
int enum_set_valid_check(const uint64_t val, const int64_t str_values_count, const bool is_enum)
{
int ret = common::OB_SUCCESS;
if (OB_UNLIKELY(str_values_count <= 0)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("unexpected str values count", K(ret), K(str_values_count), K(is_enum));
} else if (is_enum && (val > str_values_count)) {
// ENUM type, its value should not exceed str_values_count
ret = OB_ERR_UNEXPECTED;
LOG_WARN("unexpected enum value", K(ret), K(val), K(str_values_count));
} else if (!is_enum && (str_values_count < OB_MAX_SET_ELEMENT_NUM) &&
(val >= (1UL << str_values_count))) {
// SET type, its value should not be greater than or equal to 2^(str_values_count)
ret = OB_ERR_UNEXPECTED;
LOG_WARN("unexpected set value", K(ret), K(val), K(str_values_count));
}
return ret;
}
int ObExprColumnConv::column_convert(const ObExpr &expr,
ObEvalCtx &ctx,
ObDatum &datum)
{
int ret = OB_SUCCESS;
if (OB_ISNULL(expr.extra_info_)) {
ret = OB_ERR_UNEXPECTED;
LOG_WARN("extra_info_ is unexpected", K(ret), KP(expr.extra_info_));
} else {
const ObEnumSetInfo *enumset_info = static_cast<ObEnumSetInfo *>(expr.extra_info_);
const uint64_t cast_mode = enumset_info->cast_mode_;
bool is_strict = CM_IS_STRICT_MODE(cast_mode);
ObObjType out_type = expr.datum_meta_.type_;
ObCollationType out_cs_type = expr.datum_meta_.cs_type_;
ObDatum *val = NULL;
if (ob_is_enum_or_set_type(out_type) && !expr.args_[4]->obj_meta_.is_enum_or_set()) {
if (OB_FAIL(eval_enumset(expr, ctx, val))) {
LOG_WARN("fail to eval enumset result", K(ret));
}
} else {
if (OB_FAIL(expr.args_[4]->eval(ctx, val))) {
LOG_WARN("evaluate parameter failed", K(ret));
}
}
if (OB_FAIL(ret)) {
} else if (val->is_null()) {
datum.set_null();
} else {
// cast is done implictly if needed, before call this function
// 1. cs type validation for string types
// 2. accuracy check and modification
// 3. handle delta lob
if (!is_lob_storage(out_type)) {
if (ob_is_string_type(out_type)) { // in type must not be lob type
ObString str = val->get_string();
if (OB_FAIL(string_collation_check(is_strict, out_cs_type, out_type, str))) {
LOG_WARN("fail to check collation", K(ret), K(str), K(is_strict), K(expr));
} else {
val->set_string(str);
}
} else if (ob_is_enum_or_set_type(out_type)) {
if (OB_FAIL(enum_set_valid_check(val->get_uint64(), enumset_info->str_values_.count(),
(expr.datum_meta_.type_ == ObEnumType)))) {
LOG_WARN("enum set val is invalid", K(ret), K(val->get_uint64()),
K(enumset_info->str_values_.count()), K(expr));
}
}
if (OB_SUCC(ret)
&& OB_FAIL(column_convert_datum_accuracy_check(expr, ctx, false, datum, cast_mode, *val))) {
LOG_WARN("fail do datum_accuracy_check for lob res", K(ret), K(expr), K(*val));
}
if (OB_SUCC(ret)) {
LOG_DEBUG("after column convert", K(expr), K(datum), K(cast_mode));
}
} else if (is_lob_storage(out_type) && expr.args_[4]->obj_meta_.is_user_defined_sql_type()) {
// udt types can only insert to lob columns by rewrite.
// but before rewrite, column convert type deducing may happen
// so prevent the convertion during execution
ret = OB_ERR_INVALID_XML_DATATYPE;
LOG_USER_ERROR(OB_ERR_INVALID_XML_DATATYPE, ob_obj_type_str(out_type), "ANYDATA");
LOG_WARN("convert xmltype to character type is not supported in PL",
K(ret), K(expr.args_[4]->obj_meta_), K(out_type));
} else {
ObObjType in_type = expr.args_[4]->obj_meta_.get_type();
ObCollationType in_cs_type = expr.args_[4]->obj_meta_.get_collation_type();
bool has_lob_header = expr.args_[4]->obj_meta_.has_lob_header();
bool has_lob_header_for_check = has_lob_header;
ObString raw_str = val->get_string();
ObLobLocatorV2 input_lob(raw_str.ptr(), raw_str.length(), has_lob_header);
bool is_delta = input_lob.is_valid() && input_lob.is_delta_temp_lob();
if (is_delta) { // delta lob
if (!(ob_is_text_tc(in_type) || ob_is_json(in_type))) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("delta lob can not convert to non-text type", K(ret), K(out_type));
} else {
datum.set_string(raw_str);
}
} else {
ObEvalCtx::TempAllocGuard tmp_alloc_g(ctx); // temp alloc only used for lob types
common::ObArenaAllocator &temp_allocator = tmp_alloc_g.get_allocator();
ObDatum datum_for_check = *val;
ObString str;
ObTextStringIter striter(in_type, in_cs_type, val->get_string(), has_lob_header);
if (OB_FAIL(striter.init(0, ctx.exec_ctx_.get_my_session(), &temp_allocator))) {
LOG_WARN("fail to init string iter", K(ret), K(is_strict), K(expr));
} else if (OB_FAIL(striter.get_full_data(str))) {
LOG_WARN("fail to get full data from string iter", K(ret), K(is_strict), K(expr));
} else if (ob_is_geometry(out_type)) {
ObGeoType geo_type = ObGeoCastUtils::get_geo_type_from_cast_mode(cast_mode);
if (OB_FAIL(ObGeoTypeUtil::check_geo_type(geo_type, str))) {
LOG_WARN("fail to check geo type", K(ret), K(str), K(geo_type), K(expr));
ret = OB_ERR_CANT_CREATE_GEOMETRY_OBJECT;
LOG_USER_ERROR(OB_ERR_CANT_CREATE_GEOMETRY_OBJECT);
}
} else if (OB_FAIL(string_collation_check(is_strict, out_cs_type, out_type, str))) {
LOG_WARN("fail to check collation", K(ret), K(str), K(is_strict), K(expr));
}
if (OB_SUCC(ret)) {
has_lob_header_for_check = false; // datum_for_check must have no lob header
datum_for_check.set_string(str);
}
if (OB_FAIL(ret)) {
} else if (OB_FAIL(column_convert_datum_accuracy_check(expr, ctx, has_lob_header_for_check, datum,
cast_mode, datum_for_check))) {
LOG_WARN("fail do datum_accuracy_check for lob res", K(ret), K(expr), K(datum_for_check));
} else {
// in type is the same with out type, if length changed, build a new lob
ObLobLocatorV2 loc(raw_str, has_lob_header);
int64_t old_data_byte_len = 0;
if (raw_str.length() > 0) {
if (OB_FAIL(loc.get_lob_data_byte_len(old_data_byte_len))) {
LOG_WARN("Lob: failed to get data byte len", K(ret));
}
}
if (OB_SUCC(ret)) {
int64_t new_data_byte_len = datum.get_string().length();
if (new_data_byte_len == old_data_byte_len) {
datum.set_string(raw_str);
} else {
ObTextStringDatumResult str_result(expr.datum_meta_.type_, &expr, &ctx, &datum);
if (OB_FAIL(str_result.init(new_data_byte_len))) {
LOG_WARN("Lob: init lob result failed", K(ret));
} else if (OB_FAIL(str_result.append(datum.get_string().ptr(), new_data_byte_len))) {
LOG_WARN("Lob: append lob result failed", K(ret));
} else {
str_result.set_result();
}
}
}
}
LOG_DEBUG("after column convert", K(expr), K(datum), K(cast_mode));
}
}
}
}
return ret;
}
int ObExprColumnConv::column_convert_fast(const ObExpr &expr,
ObEvalCtx &ctx,
ObDatum &datum)
{
int ret = OB_SUCCESS;
ObDatum *val = nullptr;
if (OB_FAIL(expr.args_[4]->eval(ctx, val))) {
LOG_WARN("evaluate parameter failed", K(ret));
} else {
datum.set_datum(*val);
}
return ret;
}
int ObExprColumnConv::column_convert_batch(const ObExpr &expr,
ObEvalCtx &ctx,
const ObBitVector &skip,
const int64_t batch_size)
{
int ret = OB_SUCCESS;
ObObjType out_type = expr.datum_meta_.type_;
ObCollationType out_cs_type = expr.datum_meta_.cs_type_;
const ObEnumSetInfo *enumset_info = static_cast<ObEnumSetInfo *>(expr.extra_info_);
const uint64_t cast_mode = enumset_info->cast_mode_;
bool is_strict = CM_IS_STRICT_MODE(cast_mode);
if (OB_FAIL(expr.args_[4]->eval_batch(ctx, skip, batch_size))) {
LOG_WARN("failed to eval batch vals", K(ret));
} else {
ObDatum *vals = expr.args_[4]->locate_batch_datums(ctx);
ObDatum *results = expr.locate_batch_datums(ctx);
ObBitVector &eval_flags = expr.get_evaluated_flags(ctx);
bool is_string_type = ob_is_string_type(out_type);
ObAccuracy accuracy;
accuracy.set_length(expr.max_length_);
accuracy.set_scale(expr.datum_meta_.scale_);
const ObObjTypeClass &dst_tc = ob_obj_type_class(expr.datum_meta_.type_);
const ObLength max_accuracy_len = accuracy.get_length();
if (is_string_type) {
accuracy.set_length_semantics(expr.datum_meta_.length_semantics_);
}
ObEvalCtx::BatchInfoScopeGuard batch_info_guard(ctx);
batch_info_guard.set_batch_size(batch_size);
for (int64_t i = 0; OB_SUCC(ret) && i < batch_size; ++i) {
if (skip.at(i) || eval_flags.at(i)) {
continue;
}
if (vals[i].is_null()) {
results[i].set_null();
} else {
batch_info_guard.set_batch_idx(i);
if (is_string_type) {
ObString str = vals[i].get_string();
if (OB_FAIL(string_collation_check(is_strict, out_cs_type, out_type, str))) {
LOG_WARN("fail to check collation", K(ret), K(str), K(is_strict), K(expr));
} else {
vals[i].set_string(str);
}
}
bool no_need_check_length = is_string_type && max_accuracy_len > 0 && vals[i].len_ < max_accuracy_len;
if (OB_FAIL(ret)) {
} else if (no_need_check_length) {
results[i].set_datum(vals[i]);
} else if (OB_FAIL(column_convert_datum_accuracy_check(expr, ctx, false, results[i], cast_mode, vals[i]))) {
LOG_WARN("fail do datum_accuracy_check for lob res", K(ret), K(expr));
}
}
eval_flags.set(i);
}
}
return ret;
}
int ObExprColumnConv::column_convert_batch_fast(const ObExpr &expr,
ObEvalCtx &ctx,
const ObBitVector &skip,
const int64_t batch_size)
{
int ret = OB_SUCCESS;
if (OB_FAIL(expr.args_[4]->eval_batch(ctx, skip, batch_size))) {
LOG_WARN("failed to eval batch vals", K(ret));
} else {
ObDatum *vals = expr.args_[4]->locate_batch_datums(ctx);
ObDatum *results = expr.locate_batch_datums(ctx);
ObBitVector &eval_flags = expr.get_evaluated_flags(ctx);
for (int64_t i = 0; OB_SUCC(ret) && i < batch_size; ++i) {
if (skip.at(i) || eval_flags.at(i)) {
continue;
}
results[i].set_datum(vals[i]);
eval_flags.set(i);
}
}
return ret;
}
int ObExprColumnConv::eval_enumset(const ObExpr &expr, ObEvalCtx &ctx, common::ObDatum *&datum)
{
int ret = OB_SUCCESS;
const ObEnumSetInfo *enumset_info = static_cast<ObEnumSetInfo *>(expr.extra_info_);
const uint64_t cast_mode = enumset_info->cast_mode_;
const uint64_t expr_ctx_id = static_cast<uint64_t>(expr.expr_ctx_id_);
if (OB_UNLIKELY(expr_ctx_id == ObExpr::INVALID_EXP_CTX_ID)) {
ObExpr *old_expr = expr.args_[0];
expr.args_[0] = expr.args_[4];
if (OB_FAIL(expr.eval_enumset(ctx, enumset_info->str_values_, cast_mode, datum))) {
LOG_WARN("fail to eval_enumset", KPC(enumset_info), K(ret));
}
expr.args_[0] = old_expr;
} else {
ObExprColumnConvCtx *column_conv_ctx = NULL;
if (OB_ISNULL(column_conv_ctx = static_cast<ObExprColumnConvCtx *>
(ctx.exec_ctx_.get_expr_op_ctx(expr_ctx_id)))) {
if (OB_FAIL(ctx.exec_ctx_.create_expr_op_ctx(expr_ctx_id, column_conv_ctx))) {
LOG_WARN("fail to create expr op ctx", K(ret), K(expr_ctx_id));
} else if (OB_FAIL(column_conv_ctx->setup_eval_expr(ctx.exec_ctx_.get_allocator(), expr))) {
LOG_WARN("fail to init column conv ctx", K(ret));
}
}
if (OB_SUCC(ret)) {
if (OB_FAIL(column_conv_ctx->expr_.eval_enumset(ctx, enumset_info->str_values_, cast_mode,
datum))) {
LOG_WARN("fail to eval_enumset", KPC(enumset_info), K(ret));
}
}
}
return ret;
}
int ObExprColumnConv::ObExprColumnConvCtx::setup_eval_expr(ObIAllocator &allocator,
const ObExpr &expr)
{
int ret = OB_SUCCESS;
const int64_t mem_size = sizeof(ObExpr*) * expr.arg_cnt_;
if (OB_ISNULL(args_ = static_cast<ObExpr**>(allocator.alloc(mem_size)))) {
ret = OB_ALLOCATE_MEMORY_FAILED;
LOG_WARN("fail to alloc args", K(ret), K(mem_size));
} else {
expr_ = expr;
expr_.args_ = args_;
MEMCPY(args_, expr.args_, mem_size);
args_[0] = args_[4];
}
return ret;
}
//TODO(yaoying.yyy):(duplicate_with_type_to_str, remove later
int ObBaseExprColumnConv::shallow_copy_str_values(const common::ObIArray<common::ObString> &str_values)
{
int ret = OB_SUCCESS;
str_values_.reset();
if (OB_UNLIKELY(str_values.count() < 1)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid str_values", K(str_values), K(ret));
} else if (OB_FAIL(str_values_.assign(str_values))) {
LOG_WARN("fail to assign str values", K(ret));
} else {/*do nothing*/}
return ret;
}
int ObBaseExprColumnConv::deep_copy_str_values(const ObIArray<ObString> &str_values)
{
int ret = OB_SUCCESS;
str_values_.reset();
if (OB_UNLIKELY(str_values.count() < 1)) {
ret = OB_INVALID_ARGUMENT;
LOG_WARN("invalid str_values", K(str_values), K(ret));
} else if (OB_FAIL(str_values_.reserve(str_values.count()))) {
LOG_WARN("fail to init str_values_", K(ret));
} else {/*do nothing*/}
for (int64_t i = 0; OB_SUCC(ret) && i < str_values.count(); ++i) {
const ObString &str = str_values.at(i);
char *buf = NULL;
ObString str_tmp;
if (str.empty()) {
//just keep str_tmp empty
} else if (OB_UNLIKELY(NULL == (buf = static_cast<char *>(alloc_.alloc(str.length()))))) {
ret = common::OB_ALLOCATE_MEMORY_FAILED;
LOG_WARN("failed to allocate memory", K(i), K(str), K(ret));
} else {
MEMCPY(buf, str.ptr(), str.length());
str_tmp.assign_ptr(buf, str.length());
}
if (OB_SUCC(ret)) {
if (OB_FAIL(str_values_.push_back(str_tmp))) {
LOG_WARN("failed to push back str", K(i), K(str_tmp), K(str), K(ret));
}
}
}
return ret;
}
}//sql
}//oceanbase