doris/be/src/vec/core/field.h

// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements.  See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership.  The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License.  You may obtain a copy of the License at
//
//   http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied.  See the License for the
// specific language governing permissions and limitations
// under the License.
// This file is copied from
// https://github.com/ClickHouse/ClickHouse/blob/master/src/Core/Field.h
// and modified by Doris

#pragma once

#include <fmt/format.h>
#include <glog/logging.h>
#include <stdint.h>
#include <string.h>

#include <algorithm>
#include <cassert>
#include <functional>
#include <map>
#include <new>
#include <ostream>
#include <string>
#include <string_view>
#include <type_traits>
#include <utility>
#include <vector>

// IWYU pragma: no_include <opentelemetry/common/threadlocal.h>
#include "common/compiler_util.h" // IWYU pragma: keep
#include "olap/hll.h"
#include "util/bitmap_value.h"
#include "util/quantile_state.h"
#include "vec/common/uint128.h"
#include "vec/core/types.h"

namespace doris {
namespace vectorized {
template <typename T>
struct TypeId;
template <typename T>
struct TypeName;
} // namespace vectorized
struct PackedInt128;
} // namespace doris

namespace doris::vectorized {

template <typename T>
struct NearestFieldTypeImpl {
    using Type = T;
};

template <typename T>
using NearestFieldType = typename NearestFieldTypeImpl<T>::Type;

template <typename T>
struct AvgNearestFieldTypeTrait {
    using Type = typename NearestFieldTypeImpl<T>::Type;
};

template <>
struct AvgNearestFieldTypeTrait<Decimal32> {
    using Type = Decimal128I;
};

template <>
struct AvgNearestFieldTypeTrait<Decimal64> {
    using Type = Decimal128I;
};

template <>
struct AvgNearestFieldTypeTrait<Decimal128> {
    using Type = Decimal128;
};

template <>
struct AvgNearestFieldTypeTrait<Decimal128I> {
    using Type = Decimal128;
};

template <>
struct AvgNearestFieldTypeTrait<Int64> {
    using Type = double;
};

class Field;

using FieldVector = std::vector<Field>;

/// Array and Tuple use the same storage type -- FieldVector, but we declare
/// distinct types for them, so that the caller can choose whether it wants to
/// construct a Field of Array or a Tuple type. An alternative approach would be
/// to construct both of these types from FieldVector, and have the caller
/// specify the desired Field type explicitly.
#define DEFINE_FIELD_VECTOR(X)          \
    struct X : public FieldVector {     \
        using FieldVector::FieldVector; \
    }

DEFINE_FIELD_VECTOR(Array);
DEFINE_FIELD_VECTOR(Tuple);
DEFINE_FIELD_VECTOR(Map);
#undef DEFINE_FIELD_VECTOR

using FieldMap = std::map<String, Field, std::less<String>>;
#define DEFINE_FIELD_MAP(X)       \
    struct X : public FieldMap {  \
        using FieldMap::FieldMap; \
    }
DEFINE_FIELD_MAP(VariantMap);
#undef DEFINE_FIELD_MAP

class JsonbField {
public:
    JsonbField() = default;

    JsonbField(const char* ptr, uint32_t len) : size(len) {
        data = new char[size];
        if (!data) {
            LOG(FATAL) << "new data buffer failed, size: " << size;
        }
        memcpy(data, ptr, size);
    }

    JsonbField(const JsonbField& x) : size(x.size) {
        data = new char[size];
        if (!data) {
            LOG(FATAL) << "new data buffer failed, size: " << size;
        }
        memcpy(data, x.data, size);
    }

    JsonbField(JsonbField&& x) : data(x.data), size(x.size) {
        x.data = nullptr;
        x.size = 0;
    }

    JsonbField& operator=(const JsonbField& x) {
        data = new char[size];
        if (!data) {
            LOG(FATAL) << "new data buffer failed, size: " << size;
        }
        memcpy(data, x.data, size);
        return *this;
    }

    JsonbField& operator=(JsonbField&& x) {
        if (data) {
            delete[] data;
        }
        data = x.data;
        size = x.size;
        x.data = nullptr;
        x.size = 0;
        return *this;
    }

    ~JsonbField() {
        if (data) {
            delete[] data;
        }
    }

    const char* get_value() const { return data; }
    uint32_t get_size() const { return size; }

    bool operator<(const JsonbField& r) const {
        LOG(FATAL) << "comparing between JsonbField is not supported";
    }
    bool operator<=(const JsonbField& r) const {
        LOG(FATAL) << "comparing between JsonbField is not supported";
    }
    bool operator==(const JsonbField& r) const {
        LOG(FATAL) << "comparing between JsonbField is not supported";
    }
    bool operator>(const JsonbField& r) const {
        LOG(FATAL) << "comparing between JsonbField is not supported";
    }
    bool operator>=(const JsonbField& r) const {
        LOG(FATAL) << "comparing between JsonbField is not supported";
    }
    bool operator!=(const JsonbField& r) const {
        LOG(FATAL) << "comparing between JsonbField is not supported";
    }

    const JsonbField& operator+=(const JsonbField& r) {
        LOG(FATAL) << "Not support plus opration on JsonbField";
    }

    const JsonbField& operator-=(const JsonbField& r) {
        LOG(FATAL) << "Not support minus opration on JsonbField";
    }

private:
    char* data = nullptr;
    uint32_t size = 0;
};

template <typename T>
bool decimal_equal(T x, T y, UInt32 x_scale, UInt32 y_scale);
template <typename T>
bool decimal_less(T x, T y, UInt32 x_scale, UInt32 y_scale);
template <typename T>
bool decimal_less_or_equal(T x, T y, UInt32 x_scale, UInt32 y_scale);

template <typename T>
class DecimalField {
public:
    DecimalField(T value, UInt32 scale_) : dec(value), scale(scale_) {}

    operator T() const { return dec; }
    T get_value() const { return dec; }
    T get_scale_multiplier() const;
    UInt32 get_scale() const { return scale; }

    template <typename U>
    bool operator<(const DecimalField<U>& r) const {
        using MaxType = std::conditional_t<(sizeof(T) > sizeof(U)), T, U>;
        return decimal_less<MaxType>(dec, r.get_value(), scale, r.get_scale());
    }

    template <typename U>
    bool operator<=(const DecimalField<U>& r) const {
        using MaxType = std::conditional_t<(sizeof(T) > sizeof(U)), T, U>;
        return decimal_less_or_equal<MaxType>(dec, r.get_value(), scale, r.get_scale());
    }

    template <typename U>
    bool operator==(const DecimalField<U>& r) const {
        using MaxType = std::conditional_t<(sizeof(T) > sizeof(U)), T, U>;
        return decimal_equal<MaxType>(dec, r.get_value(), scale, r.get_scale());
    }

    template <typename U>
    bool operator>(const DecimalField<U>& r) const {
        return r < *this;
    }
    template <typename U>
    bool operator>=(const DecimalField<U>& r) const {
        return r <= *this;
    }
    template <typename U>
    bool operator!=(const DecimalField<U>& r) const {
        return !(*this == r);
    }

    const DecimalField<T>& operator+=(const DecimalField<T>& r) {
        if (scale != r.get_scale()) {
            LOG(FATAL) << "Add different decimal fields";
        }
        dec += r.get_value();
        return *this;
    }

    const DecimalField<T>& operator-=(const DecimalField<T>& r) {
        if (scale != r.get_scale()) {
            LOG(FATAL) << "Sub different decimal fields";
        }
        dec -= r.get_value();
        return *this;
    }

private:
    T dec;
    UInt32 scale;
};

/** 32 is enough. Round number is used for alignment and for better arithmetic inside std::vector.
  * NOTE: Actually, sizeof(std::string) is 32 when using libc++, so Field is 40 bytes.
  */
#define DBMS_MIN_FIELD_SIZE 32

/** Discriminated union of several types.
  * Made for replacement of `boost::variant`
  *  is not generalized,
  *  but somewhat more efficient, and simpler.
  *
  * Used to represent a single value of one of several types in memory.
  * Warning! Prefer to use chunks of columns instead of single values. See Column.h
  */
class Field {
public:
    struct Types {
        /// Type tag.
        enum Which {
            Null = 0,
            UInt64 = 1,
            Int64 = 2,
            Float64 = 3,
            UInt128 = 4,
            Int128 = 5,
            FixedLengthObject = 6,

            /// Non-POD types.

            String = 16,
            Array = 17,
            Tuple = 18,
            Decimal32 = 19,
            Decimal64 = 20,
            Decimal128 = 21,
            AggregateFunctionState = 22,
            JSONB = 23,
            Decimal128I = 24,
            Map = 25,
            VariantMap = 26,
            Bitmap = 27,
            HyperLogLog = 28,
            QuantileState = 29,
        };

        static const int MIN_NON_POD = 16;

        static const char* to_string(Which which) {
            switch (which) {
            case Null:
                return "Null";
            case UInt64:
                return "UInt64";
            case UInt128:
                return "UInt128";
            case Int64:
                return "Int64";
            case Int128:
                return "Int128";
            case Float64:
                return "Float64";
            case String:
                return "String";
            case JSONB:
                return "JSONB";
            case Array:
                return "Array";
            case Tuple:
                return "Tuple";
            case Map:
                return "Map";
            case Decimal32:
                return "Decimal32";
            case Decimal64:
                return "Decimal64";
            case Decimal128:
                return "Decimal128";
            case Decimal128I:
                return "Decimal128I";
            case FixedLengthObject:
                return "FixedLengthObject";
            case VariantMap:
                return "VariantMap";
            case Bitmap:
                return "Bitmap";
            case HyperLogLog:
                return "HyperLogLog";
            case QuantileState:
                return "QuantileState";
            default:
                LOG(FATAL) << "type not supported, type=" << Types::to_string(which);
                break;
            }
        }
    };

    /// Returns an identifier for the type or vice versa.
    template <typename T>
    struct TypeToEnum;
    template <Types::Which which>
    struct EnumToType;

    static bool is_decimal(Types::Which which) {
        return (which >= Types::Decimal32 && which <= Types::Decimal128) ||
               which == Types::Decimal128I;
    }

    Field() : which(Types::Null) {}

    // set Types::Null explictly and avoid other types
    Field(Types::Which w) : which(w) { DCHECK_EQ(Types::Null, which); }

    /** Despite the presence of a template constructor, this constructor is still needed,
      *  since, in its absence, the compiler will still generate the default constructor.
      */
    Field(const Field& rhs) { create(rhs); }

    Field(Field&& rhs) { create(std::move(rhs)); }

    template <typename T>
        requires(!std::is_same_v<std::decay_t<T>, Field>)
    Field(T&& rhs);

    /// Create a string inplace.
    Field(const char* data, size_t size) { create(data, size); }

    Field(const unsigned char* data, size_t size) { create(data, size); }

    /// NOTE In case when field already has string type, more direct assign is possible.
    void assign_string(const char* data, size_t size) {
        destroy();
        create(data, size);
    }

    void assign_string(const unsigned char* data, size_t size) {
        destroy();
        create(data, size);
    }

    void assign_jsonb(const char* data, size_t size) {
        destroy();
        create_jsonb(data, size);
    }

    void assign_jsonb(const unsigned char* data, size_t size) {
        destroy();
        create_jsonb(data, size);
    }

    Field& operator=(const Field& rhs) {
        if (this != &rhs) {
            if (which != rhs.which) {
                destroy();
                create(rhs);
            } else
                assign(rhs); /// This assigns string or vector without deallocation of existing buffer.
        }
        return *this;
    }

    Field& operator=(Field&& rhs) {
        if (this != &rhs) {
            if (which != rhs.which) {
                destroy();
                create(std::move(rhs));
            } else
                assign(std::move(rhs));
        }
        return *this;
    }

    template <typename T>
        requires(!std::is_same_v<std::decay_t<T>, Field>)
    Field& operator=(T&& rhs);

    ~Field() { destroy(); }

    Types::Which get_type() const { return which; }
    const char* get_type_name() const { return Types::to_string(which); }

    bool is_null() const { return which == Types::Null; }

    template <typename T>
    T& get() {
        using TWithoutRef = std::remove_reference_t<T>;
        TWithoutRef* MAY_ALIAS ptr = reinterpret_cast<TWithoutRef*>(&storage);
        return *ptr;
    }

    template <typename T>
    const T& get() const {
        using TWithoutRef = std::remove_reference_t<T>;
        const TWithoutRef* MAY_ALIAS ptr = reinterpret_cast<const TWithoutRef*>(&storage);
        return *ptr;
    }

    template <typename T>
    bool try_get(T& result) {
        const Types::Which requested = TypeToEnum<std::decay_t<T>>::value;
        if (which != requested) return false;
        result = get<T>();
        return true;
    }

    template <typename T>
    bool try_get(T& result) const {
        const Types::Which requested = TypeToEnum<std::decay_t<T>>::value;
        if (which != requested) return false;
        result = get<T>();
        return true;
    }

    template <typename T>
    T& safe_get() {
        const Types::Which requested = TypeToEnum<std::decay_t<T>>::value;
        CHECK_EQ(which, requested) << fmt::format("Bad get: has {}, requested {}", get_type_name(),
                                                  Types::to_string(requested));
        return get<T>();
    }

    template <typename T>
    const T& safe_get() const {
        const Types::Which requested = TypeToEnum<std::decay_t<T>>::value;
        CHECK_EQ(which, requested) << fmt::format("Bad get: has {}, requested {}", get_type_name(),
                                                  Types::to_string(requested));
        return get<T>();
    }

    bool operator==(const Field& rhs) const {
        return operator<=>(rhs) == std::strong_ordering::equal;
    }

    std::strong_ordering operator<=>(const Field& rhs) const {
        if (which == Types::Null || rhs == Types::Null) {
            return std::strong_ordering::equal;
        }
        if (which != rhs.which) {
            LOG(FATAL) << "lhs type not equal with rhs, lhs=" << Types::to_string(which)
                       << ", rhs=" << Types::to_string(rhs.which);
        }

        switch (which) {
        case Types::Bitmap:
        case Types::HyperLogLog:
        case Types::QuantileState:
        case Types::FixedLengthObject:
        case Types::JSONB:
        case Types::Null:
        case Types::Array:
        case Types::Tuple:
        case Types::Map:
        case Types::VariantMap:
            return std::strong_ordering::equal;
        case Types::UInt64:
            return get<UInt64>() <=> rhs.get<UInt64>();
        case Types::UInt128:
            return get<UInt128>() <=> rhs.get<UInt128>();
        case Types::Int64:
            return get<Int64>() <=> rhs.get<Int64>();
        case Types::Int128:
            return get<Int128>() <=> rhs.get<Int128>();
        case Types::Float64:
            return get<Float64>() < rhs.get<Float64>()    ? std::strong_ordering::less
                   : get<Float64>() == rhs.get<Float64>() ? std::strong_ordering::equal
                                                          : std::strong_ordering::greater;
        case Types::String:
            return get<String>() <=> rhs.get<String>();
        case Types::Decimal32:
            return get<Decimal32>() <=> rhs.get<Decimal32>();
        case Types::Decimal64:
            return get<Decimal64>() <=> rhs.get<Decimal64>();
        case Types::Decimal128:
            return get<Decimal128>() <=> rhs.get<Decimal128>();
        case Types::Decimal128I:
            return get<Decimal128I>() <=> rhs.get<Decimal128I>();
        default:
            LOG(FATAL) << "lhs type not equal with rhs, lhs=" << Types::to_string(which)
                       << ", rhs=" << Types::to_string(rhs.which);
            break;
        }
    }

private:
    std::aligned_union_t<DBMS_MIN_FIELD_SIZE - sizeof(Types::Which), Null, UInt64, UInt128, Int64,
                         Int128, Float64, String, JsonbField, Array, Tuple, Map, VariantMap,
                         DecimalField<Decimal32>, DecimalField<Decimal64>, DecimalField<Decimal128>,
                         DecimalField<Decimal128I>, BitmapValue, HyperLogLog, QuantileState>
            storage;

    Types::Which which;

    /// Assuming there was no allocated state or it was deallocated (see destroy).
    template <typename T>
    void create_concrete(T&& x) {
        using UnqualifiedType = std::decay_t<T>;

        // In both Field and PODArray, small types may be stored as wider types,
        // e.g. char is stored as UInt64. Field can return this extended value
        // with get<StorageType>(). To avoid uninitialized results from get(),
        // we must initialize the entire wide stored type, and not just the
        // nominal type.
        using StorageType = NearestFieldType<UnqualifiedType>;
        new (&storage) StorageType(std::forward<T>(x));
        which = TypeToEnum<UnqualifiedType>::value;
    }

    /// Assuming same types.
    template <typename T>
    void assign_concrete(T&& x) {
        using JustT = std::decay_t<T>;
        assert(which == TypeToEnum<JustT>::value);
        JustT* MAY_ALIAS ptr = reinterpret_cast<JustT*>(&storage);
        *ptr = std::forward<T>(x);
    }

    template <typename F,
              typename Field> /// Field template parameter may be const or non-const Field.
    static void dispatch(F&& f, Field& field) {
        switch (field.which) {
        case Types::Null:
            f(field.template get<Null>());
            return;
        case Types::UInt64:
            f(field.template get<UInt64>());
            return;
        case Types::UInt128:
            f(field.template get<UInt128>());
            return;
        case Types::Int64:
            f(field.template get<Int64>());
            return;
        case Types::Int128:
            f(field.template get<Int128>());
            return;
        case Types::Float64:
            f(field.template get<Float64>());
            return;
        case Types::String:
            f(field.template get<String>());
            return;
        case Types::JSONB:
            f(field.template get<JsonbField>());
            return;
        case Types::Array:
            f(field.template get<Array>());
            return;
        case Types::Tuple:
            f(field.template get<Tuple>());
            return;
        case Types::Map:
            f(field.template get<Map>());
            return;
        case Types::Decimal32:
            f(field.template get<DecimalField<Decimal32>>());
            return;
        case Types::Decimal64:
            f(field.template get<DecimalField<Decimal64>>());
            return;
        case Types::Decimal128:
            f(field.template get<DecimalField<Decimal128>>());
            return;
        case Types::Decimal128I:
            f(field.template get<DecimalField<Decimal128I>>());
            return;
        case Types::VariantMap:
            f(field.template get<VariantMap>());
            return;
        case Types::Bitmap:
            f(field.template get<BitmapValue>());
            return;
        case Types::HyperLogLog:
            f(field.template get<HyperLogLog>());
            return;
        case Types::QuantileState:
            f(field.template get<QuantileState>());
            return;
        default:
            LOG(FATAL) << "type not supported, type=" << Types::to_string(field.which);
            break;
        }
    }

    void create(const Field& x) {
        dispatch([this](auto& value) { create_concrete(value); }, x);
    }

    void create(Field&& x) {
        dispatch([this](auto& value) { create_concrete(std::move(value)); }, x);
    }

    void assign(const Field& x) {
        dispatch([this](auto& value) { assign_concrete(value); }, x);
    }

    void assign(Field&& x) {
        dispatch([this](auto& value) { assign_concrete(std::move(value)); }, x);
    }

    void create(const char* data, size_t size) {
        new (&storage) String(data, size);
        which = Types::String;
    }

    void create(const unsigned char* data, size_t size) {
        create(reinterpret_cast<const char*>(data), size);
    }

    void create_jsonb(const char* data, size_t size) {
        new (&storage) JsonbField(data, size);
        which = Types::JSONB;
    }

    void create_jsonb(const unsigned char* data, size_t size) {
        new (&storage) JsonbField(reinterpret_cast<const char*>(data), size);
        which = Types::JSONB;
    }

    ALWAYS_INLINE void destroy() {
        if (which < Types::MIN_NON_POD) return;

        switch (which) {
        case Types::String:
            destroy<String>();
            break;
        case Types::JSONB:
            destroy<JsonbField>();
            break;
        case Types::Array:
            destroy<Array>();
            break;
        case Types::Tuple:
            destroy<Tuple>();
            break;
        case Types::Map:
            destroy<Map>();
            break;
        case Types::VariantMap:
            destroy<VariantMap>();
            break;
        default:
            break;
        }

        which = Types::
                Null; /// for exception safety in subsequent calls to destroy and create, when create fails.
    }

    template <typename T>
    void destroy() {
        T* MAY_ALIAS ptr = reinterpret_cast<T*>(&storage);
        ptr->~T();
    }
};

#undef DBMS_MIN_FIELD_SIZE

template <>
struct TypeId<Tuple> {
    static constexpr const TypeIndex value = TypeIndex::Tuple;
};
template <>
struct TypeId<DecimalField<Decimal32>> {
    static constexpr const TypeIndex value = TypeIndex::Decimal32;
};
template <>
struct TypeId<DecimalField<Decimal64>> {
    static constexpr const TypeIndex value = TypeIndex::Decimal64;
};
template <>
struct TypeId<DecimalField<Decimal128>> {
    static constexpr const TypeIndex value = TypeIndex::Decimal128;
};
template <>
struct TypeId<DecimalField<Decimal128I>> {
    static constexpr const TypeIndex value = TypeIndex::Decimal128I;
};
template <>
struct Field::TypeToEnum<Null> {
    static constexpr Types::Which value = Types::Null;
};
template <>
struct Field::TypeToEnum<UInt64> {
    static constexpr Types::Which value = Types::UInt64;
};
template <>
struct Field::TypeToEnum<UInt128> {
    static constexpr Types::Which value = Types::UInt128;
};
template <>
struct Field::TypeToEnum<Int64> {
    static constexpr Types::Which value = Types::Int64;
};
template <>
struct Field::TypeToEnum<Int128> {
    static constexpr Types::Which value = Types::Int128;
};
template <>
struct Field::TypeToEnum<Float64> {
    static constexpr Types::Which value = Types::Float64;
};
template <>
struct Field::TypeToEnum<String> {
    static constexpr Types::Which value = Types::String;
};
template <>
struct Field::TypeToEnum<JsonbField> {
    static const Types::Which value = Types::JSONB;
};
template <>
struct Field::TypeToEnum<Array> {
    static constexpr Types::Which value = Types::Array;
};
template <>
struct Field::TypeToEnum<Tuple> {
    static constexpr Types::Which value = Types::Tuple;
};
template <>
struct Field::TypeToEnum<Map> {
    static const Types::Which value = Types::Map;
};
template <>
struct Field::TypeToEnum<DecimalField<Decimal32>> {
    static constexpr Types::Which value = Types::Decimal32;
};
template <>
struct Field::TypeToEnum<DecimalField<Decimal64>> {
    static constexpr Types::Which value = Types::Decimal64;
};
template <>
struct Field::TypeToEnum<DecimalField<Decimal128>> {
    static constexpr Types::Which value = Types::Decimal128;
};
template <>
struct Field::TypeToEnum<DecimalField<Decimal128I>> {
    static constexpr Types::Which value = Types::Decimal128I;
};
template <>
struct Field::TypeToEnum<VariantMap> {
    static constexpr Types::Which value = Types::VariantMap;
};

template <>
struct Field::TypeToEnum<BitmapValue> {
    static constexpr Types::Which value = Types::Bitmap;
};

template <>
struct Field::TypeToEnum<HyperLogLog> {
    static constexpr Types::Which value = Types::HyperLogLog;
};

template <>
struct Field::TypeToEnum<QuantileState> {
    static constexpr Types::Which value = Types::QuantileState;
};

template <>
struct Field::EnumToType<Field::Types::Null> {
    using Type = Null;
};
template <>
struct Field::EnumToType<Field::Types::UInt64> {
    using Type = UInt64;
};
template <>
struct Field::EnumToType<Field::Types::UInt128> {
    using Type = UInt128;
};
template <>
struct Field::EnumToType<Field::Types::Int64> {
    using Type = Int64;
};
template <>
struct Field::EnumToType<Field::Types::Int128> {
    using Type = Int128;
};
template <>
struct Field::EnumToType<Field::Types::Float64> {
    using Type = Float64;
};
template <>
struct Field::EnumToType<Field::Types::String> {
    using Type = String;
};
template <>
struct Field::EnumToType<Field::Types::JSONB> {
    using Type = JsonbField;
};
template <>
struct Field::EnumToType<Field::Types::Array> {
    using Type = Array;
};
template <>
struct Field::EnumToType<Field::Types::Tuple> {
    using Type = Tuple;
};
template <>
struct Field::EnumToType<Field::Types::Map> {
    using Type = Map;
};
template <>
struct Field::EnumToType<Field::Types::Decimal32> {
    using Type = DecimalField<Decimal32>;
};
template <>
struct Field::EnumToType<Field::Types::Decimal64> {
    using Type = DecimalField<Decimal64>;
};
template <>
struct Field::EnumToType<Field::Types::Decimal128> {
    using Type = DecimalField<Decimal128>;
};
template <>
struct Field::EnumToType<Field::Types::Decimal128I> {
    using Type = DecimalField<Decimal128I>;
};
template <>
struct Field::EnumToType<Field::Types::VariantMap> {
    using Type = VariantMap;
};

template <typename T>
T get(const Field& field) {
    return field.template get<T>();
}

template <typename T>
T get(Field& field) {
    return field.template get<T>();
}

template <typename T>
T safe_get(const Field& field) {
    return field.template safe_get<T>();
}

template <typename T>
T safe_get(Field& field) {
    return field.template safe_get<T>();
}

template <>
struct TypeName<Array> {
    static std::string get() { return "Array"; }
};
template <>
struct TypeName<Tuple> {
    static std::string get() { return "Tuple"; }
};

template <>
struct TypeName<VariantMap> {
    static std::string get() { return "VariantMap"; }
};
template <>
struct TypeName<Map> {
    static std::string get() { return "Map"; }
};

/// char may be signed or unsigned, and behave identically to signed char or unsigned char,
///  but they are always three different types.
/// signedness of char is different in Linux on x86 and Linux on ARM.
template <>
struct NearestFieldTypeImpl<char> {
    using Type = std::conditional_t<std::is_signed_v<char>, Int64, UInt64>;
};
template <>
struct NearestFieldTypeImpl<signed char> {
    using Type = Int64;
};
template <>
struct NearestFieldTypeImpl<unsigned char> {
    using Type = Int64;
};

template <>
struct NearestFieldTypeImpl<UInt16> {
    using Type = UInt64;
};
template <>
struct NearestFieldTypeImpl<UInt32> {
    using Type = UInt64;
};

template <>
struct NearestFieldTypeImpl<Int16> {
    using Type = Int64;
};
template <>
struct NearestFieldTypeImpl<Int32> {
    using Type = Int64;
};

/// long and long long are always different types that may behave identically or not.
/// This is different on Linux and Mac.
template <>
struct NearestFieldTypeImpl<long> {
    using Type = Int64;
};

template <>
struct NearestFieldTypeImpl<Decimal32> {
    using Type = DecimalField<Decimal32>;
};
template <>
struct NearestFieldTypeImpl<Decimal64> {
    using Type = DecimalField<Decimal64>;
};
template <>
struct NearestFieldTypeImpl<Decimal128> {
    using Type = DecimalField<Decimal128>;
};
template <>
struct NearestFieldTypeImpl<Decimal128I> {
    using Type = DecimalField<Decimal128I>;
};
template <>
struct NearestFieldTypeImpl<DecimalField<Decimal32>> {
    using Type = DecimalField<Decimal32>;
};
template <>
struct NearestFieldTypeImpl<DecimalField<Decimal64>> {
    using Type = DecimalField<Decimal64>;
};
template <>
struct NearestFieldTypeImpl<DecimalField<Decimal128>> {
    using Type = DecimalField<Decimal128>;
};
template <>
struct NearestFieldTypeImpl<DecimalField<Decimal128I>> {
    using Type = DecimalField<Decimal128I>;
};
template <>
struct NearestFieldTypeImpl<Float32> {
    using Type = Float64;
};
template <>
struct NearestFieldTypeImpl<const char*> {
    using Type = String;
};
template <>
struct NearestFieldTypeImpl<bool> {
    using Type = UInt64;
};

template <>
struct NearestFieldTypeImpl<std::string_view> {
    using Type = String;
};

template <>
struct Field::TypeToEnum<PackedInt128> {
    static const Types::Which value = Types::Int128;
};

template <>
struct NearestFieldTypeImpl<PackedInt128> {
    using Type = Int128;
};

template <typename T>
decltype(auto) cast_to_nearest_field_type(T&& x) {
    using U = NearestFieldType<std::decay_t<T>>;
    if constexpr (std::is_same_v<PackedInt128, std::decay_t<T>>) {
        return U(x.value);
    } else if constexpr (std::is_same_v<std::decay_t<T>, U>) {
        return std::forward<T>(x);
    } else {
        return U(x);
    }
}

/// This (rather tricky) code is to avoid ambiguity in expressions like
/// Field f = 1;
/// instead of
/// Field f = Int64(1);
/// Things to note:
/// 1. float <--> int needs explicit cast
/// 2. customized types needs explicit cast
template <typename T>
    requires(!std::is_same_v<std::decay_t<T>, Field>)
Field::Field(T&& rhs) {
    auto&& val = cast_to_nearest_field_type(std::forward<T>(rhs));
    create_concrete(std::forward<decltype(val)>(val));
}

template <typename T>
    requires(!std::is_same_v<std::decay_t<T>, Field>)
Field& Field::operator=(T&& rhs) {
    auto&& val = cast_to_nearest_field_type(std::forward<T>(rhs));
    using U = decltype(val);
    if (which != TypeToEnum<std::decay_t<U>>::value) {
        destroy();
        create_concrete(std::forward<U>(val));
    } else {
        assign_concrete(std::forward<U>(val));
    }

    return *this;
}

} // namespace doris::vectorized