214 lines
5.7 KiB
C++
214 lines
5.7 KiB
C++
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
// This file is copied from
// https://github.com/ClickHouse/ClickHouse/blob/master/src/Common/Uint128.h
// and modified by Doris
|
|
|
|
#pragma once
|
|
|
|
#include <iomanip>
|
|
#include <sstream>
|
|
#include <tuple>
|
|
|
|
#include "gutil/hash/city.h"
|
|
#include "gutil/hash/hash128to64.h"
|
|
#include "util/sse_util.hpp"
|
|
#include "vec/core/types.h"
|
|
|
|
namespace doris::vectorized {
|
|
|
|
/// For aggregation by SipHash, UUID type or concatenation of several fields.
|
|
struct UInt128 {
|
|
/// This naming assumes little endian.
|
|
UInt64 low;
|
|
UInt64 high;
|
|
|
|
UInt128() = default;
|
|
explicit UInt128(const UInt64 low_, const UInt64 high_) : low(low_), high(high_) {}
|
|
explicit UInt128(const UInt64 rhs) : low(rhs), high() {}
|
|
|
|
auto tuple() const { return std::tie(high, low); }
|
|
|
|
String to_hex_string() const {
|
|
std::ostringstream os;
|
|
os << std::setw(16) << std::setfill('0') << std::hex << high << low;
|
|
return String(os.str());
|
|
}
|
|
|
|
bool operator==(const UInt128 rhs) const { return tuple() == rhs.tuple(); }
|
|
auto operator<=>(const UInt128 rhs) const { return tuple() <=> rhs.tuple(); }
|
|
|
|
UInt128 operator<<(const UInt128& rhs) const {
|
|
const uint64_t shift = rhs.low;
|
|
if (((bool)rhs.high) || (shift >= 128)) {
|
|
return UInt128(0);
|
|
} else if (shift == 64) {
|
|
return UInt128(0, low);
|
|
} else if (shift == 0) {
|
|
return *this;
|
|
} else if (shift < 64) {
|
|
return UInt128(low << shift, (high << shift) + (low >> (64 - shift)));
|
|
} else if ((128 > shift) && (shift > 64)) {
|
|
return UInt128(0, low << (shift - 64));
|
|
} else {
|
|
return UInt128(0);
|
|
}
|
|
}
|
|
|
|
UInt128& operator<<=(const UInt128& rhs) {
|
|
*this = *this << rhs;
|
|
return *this;
|
|
}
|
|
|
|
UInt128 operator+(const UInt128& rhs) const {
|
|
return UInt128(low + rhs.low, high + rhs.high + ((low + rhs.low) < low));
|
|
}
|
|
|
|
UInt128& operator+=(const UInt128& rhs) {
|
|
high += rhs.high + ((low + rhs.low) < low);
|
|
low += rhs.low;
|
|
return *this;
|
|
}
|
|
|
|
template <typename T>
|
|
bool operator==(const T rhs) const {
|
|
return *this == UInt128(rhs);
|
|
}
|
|
template <typename T>
|
|
auto operator<=>(const T rhs) const {
|
|
return *this <=> UInt128(rhs);
|
|
}
|
|
|
|
template <typename T>
|
|
explicit operator T() const {
|
|
return static_cast<T>(low);
|
|
}
|
|
|
|
UInt128& operator=(const UInt64 rhs) {
|
|
low = rhs;
|
|
high = 0;
|
|
return *this;
|
|
}
|
|
|
|
operator uint128_t() const {
|
|
uint128_t value = static_cast<uint128_t>(high) << 64;
|
|
value |= low;
|
|
return value;
|
|
}
|
|
};
|
|
|
|
template <>
|
|
inline constexpr bool IsNumber<UInt128> = true;
|
|
template <>
|
|
struct TypeName<UInt128> {
|
|
static const char* get() { return "UInt128"; }
|
|
};
|
|
template <>
|
|
struct TypeId<UInt128> {
|
|
static constexpr const TypeIndex value = TypeIndex::UInt128;
|
|
};
|
|
|
|
struct UInt128Hash {
|
|
size_t operator()(UInt128 x) const { return Hash128to64({x.low, x.high}); }
|
|
};
|
|
|
|
#if defined(__SSE4_2__) || defined(__aarch64__)
|
|
|
|
struct UInt128HashCRC32 {
|
|
size_t operator()(const UInt128& x) const {
|
|
UInt64 crc = -1ULL;
|
|
crc = _mm_crc32_u64(crc, x.low);
|
|
crc = _mm_crc32_u64(crc, x.high);
|
|
return crc;
|
|
}
|
|
};
|
|
|
|
#else
|
|
|
|
/// On other platforms we do not use CRC32. NOTE This can be confusing.
|
|
struct UInt128HashCRC32 : public UInt128Hash {};
|
|
|
|
#endif
|
|
|
|
struct UInt128TrivialHash {
|
|
size_t operator()(UInt128 x) const { return x.low; }
|
|
};
|
|
|
|
/** Used for aggregation, for putting a large number of constant-length keys in a hash table.
|
|
*/
|
|
struct UInt256 {
|
|
UInt64 a;
|
|
UInt64 b;
|
|
UInt64 c;
|
|
UInt64 d;
|
|
|
|
bool operator==(const UInt256 rhs) const {
|
|
return a == rhs.a && b == rhs.b && c == rhs.c && d == rhs.d;
|
|
}
|
|
|
|
bool operator==(const UInt64 rhs) const { return a == rhs && b == 0 && c == 0 && d == 0; }
|
|
|
|
UInt256& operator=(const UInt64 rhs) {
|
|
a = rhs;
|
|
b = 0;
|
|
c = 0;
|
|
d = 0;
|
|
return *this;
|
|
}
|
|
};
|
|
|
|
#pragma pack(1)
|
|
struct UInt136 {
|
|
UInt8 a;
|
|
UInt64 b;
|
|
UInt64 c;
|
|
|
|
bool operator==(const UInt136 rhs) const { return a == rhs.a && b == rhs.b && c == rhs.c; }
|
|
};
|
|
#pragma pack()
|
|
|
|
} // namespace doris::vectorized
|
|
|
|
/// Overload hash for type casting
|
|
template <>
|
|
struct std::hash<doris::vectorized::UInt128> {
|
|
size_t operator()(const doris::vectorized::UInt128& u) const {
|
|
return Hash128to64({u.low, u.high});
|
|
}
|
|
};
|
|
|
|
template <>
|
|
struct std::is_signed<doris::vectorized::UInt128> {
|
|
static constexpr bool value = false;
|
|
};
|
|
|
|
template <>
|
|
struct std::is_unsigned<doris::vectorized::UInt128> {
|
|
static constexpr bool value = true;
|
|
};
|
|
|
|
template <>
|
|
struct std::is_integral<doris::vectorized::UInt128> {
|
|
static constexpr bool value = true;
|
|
};
|
|
|
|
// Operator +, -, /, *, % aren't implemented, so it's not an arithmetic type
|
|
template <>
|
|
struct std::is_arithmetic<doris::vectorized::UInt128> {
|
|
static constexpr bool value = false;
|
|
};
|