doris/be/src/runtime/decimal_value.cpp

// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements.  See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership.  The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License.  You may obtain a copy of the License at
//
//   http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied.  See the License for the
// specific language governing permissions and limitations
// under the License.

#include "runtime/decimal_value.h"

#include <algorithm>
#include <iostream>
#include <utility>

namespace doris {

// Class-name string for DecimalValue. Presumably used to look this type up in
// LLVM-generated code -- TODO confirm against the users of _s_llvm_class_name.
const char* DecimalValue::_s_llvm_class_name = "class.doris::DecimalValue";

// Clamp from above: lower *num1_ptr to num2 when num2 is the smaller value;
// otherwise *num1_ptr keeps its current value.
template<typename T> inline void set_if_smaller(T* num1_ptr, const T num2) {
    *num1_ptr = std::min(*num1_ptr, num2);
}

// Clamp from below: raise *num1_ptr to num2 when num2 is the bigger value;
// otherwise *num1_ptr keeps its current value.
template<typename T> inline void set_if_bigger(T* num1_ptr, const T num2) {
    *num1_ptr = std::max(*num1_ptr, num2);
}

// Fits an (integer length, fraction length) pair into a capacity of `len`.
// Callers in this file pass lengths counted in int32_t buffer words.
//   - both parts fit:               nothing is changed,        *error = E_DEC_OK
//   - only the integer part fits:   *frac_len = len - *int_len, *error = E_DEC_TRUNCATED
//   - the integer part is too long: *int_len = len, *frac_len = 0,
//                                   *error = E_DEC_OVERFLOW
inline void fix_intg_frac_error(
        const int32_t len,
        int32_t* int_len,
        int32_t* frac_len,
        int32_t* error) {
    if (*int_len + *frac_len <= len) {
        *error = E_DEC_OK;
        return;
    }
    if (*int_len <= len) {
        // Keep the whole integer part and give the fraction the space left.
        *frac_len = len - *int_len;
        *error = E_DEC_TRUNCATED;
        return;
    }
    // Not even the integer part fits.
    *int_len = len;
    *frac_len = 0;
    *error = E_DEC_OVERFLOW;
}

// *to = (value1 + value2 + *carry) reduced once by DIG_BASE.
// On return *carry is 1 if the sum reached DIG_BASE, 0 otherwise.
// Note: only a single reduction is performed, so the incoming carry is
//       expected to be at most 1 (use add2() when it can be larger).
inline void add(const int32_t value1, const int32_t value2, int32_t* to, int32_t* carry) {
    int32_t total = value1 + value2 + *carry;
    const bool overflowed = (total >= DIG_BASE);
    if (overflowed) {
        total -= DIG_BASE;
    }
    *carry = overflowed ? 1 : 0;
    *to = total;
}

// *to = value1 - value2 - *carry, with the incoming *carry acting as a borrow.
// When the difference is negative, DIG_BASE is added once and *carry is set
// to 1; otherwise *carry is set to 0.
inline void sub(const int32_t value1, const int32_t value2, int32_t* to, int32_t* carry) {
    int32_t diff = value1 - value2 - *carry;
    const bool borrowed = (diff < 0);
    if (borrowed) {
        diff += DIG_BASE;
    }
    *carry = borrowed ? 1 : 0;
    *to = diff;
}

// Like add(), but the incoming carry may be larger than 1, so the sum is
// reduced by DIG_BASE up to two times; the outgoing *carry is 0, 1 or 2.
inline void add2(const int32_t value1, const int32_t value2, int32_t* to, int32_t* carry) {
    // Three int32_t operands can exceed INT32_MAX when added, so the sum is
    // accumulated in 64 bits.
    int64_t total = static_cast<int64_t>(value1) + value2 + *carry;
    int32_t carry_out = 0;
    if (total >= DIG_BASE) {
        total -= DIG_BASE;
        carry_out = 1;
        if (total >= DIG_BASE) {
            total -= DIG_BASE;
            carry_out = 2;
        }
    }
    *carry = carry_out;
    // Callers rely on the reduced sum being below DIG_BASE here.
    *to = static_cast<int32_t>(total);
}

// Like sub(), but the incoming borrow may be larger than 1, so DIG_BASE is
// added back up to two times; the outgoing *carry (borrow) is 0, 1 or 2.
inline void sub2(const int32_t value1, const int32_t value2, int32_t* to, int32_t* carry) {
    int32_t diff = value1 - value2 - *carry;
    int32_t borrow_out = 0;
    if (diff < 0) {
        diff += DIG_BASE;
        borrow_out = 1;
        if (diff < 0) {
            diff += DIG_BASE;
            borrow_out = 2;
        }
    }
    *carry = borrow_out;
    *to = diff;
}

// Adds the digit buffers of value1 and value2 (their signs are not examined)
// and stores the sum in *to; the result takes value1's sign. operator+ and the
// binary operator- below call this when the effective operation is an addition
// of magnitudes.
//
// Lengths are handled in buffer words: round_up() (defined elsewhere) is used
// to turn the digit counts _int_length/_frac_length into word counts, and
// DIG_PER_DEC1 converts word counts back into digits.
//
// @return E_DEC_OK;
//         E_DEC_TRUNCATED when fraction words had to be dropped so that the
//         result fits into to->_buffer_length words;
//         E_DEC_OVERFLOW when the integer part does not fit, in which case
//         *to is filled through to_max_decimal().
int32_t do_add(
        const DecimalValue& value1,
        const DecimalValue& value2,
        DecimalValue* to) {
    int32_t intg1 = round_up(value1._int_length);
    int32_t intg2 = round_up(value2._int_length);
    int32_t frac1 = round_up(value1._frac_length);
    int32_t frac2 = round_up(value2._frac_length);
    int32_t frac0 = std::max(frac1, frac2);
    int32_t intg0 = std::max(intg1, intg2);

    // Is there a need for extra word because of carry?
    // Only the most significant word of the longer operand (or the sum of both
    // leading words when the integer parts are equally long) is inspected.
    int32_t first_big_digit_sum = intg1 > intg2 ? value1._buffer[0] :
        intg2 > intg1 ? value2._buffer[0] :
        value1._buffer[0] + value2._buffer[0];
    if (first_big_digit_sum > DIG_MAX - 1) {
        // yes, there is
        ++intg0;
        to->_buffer[0] = 0; // for safety
    }

    to->_sign = value1._sign;

    int32_t error = E_DEC_OK;
    fix_intg_frac_error(to->_buffer_length, &intg0, &frac0, &error);
    if (error == E_DEC_OVERFLOW) {
        // The integer part cannot be stored: fill *to with the largest value
        // of _buffer_length * DIG_PER_DEC1 integer digits and no fraction.
        to->to_max_decimal(to->_buffer_length * DIG_PER_DEC1, 0);
        return error;
    }

    // buf0 is the write cursor; it starts one past the last result word and
    // moves towards to->_buffer.
    int32_t *buf0 = to->_buffer + intg0 + frac0;
    to->_int_length = intg0 * DIG_PER_DEC1;
    to->_frac_length = std::max(value1._frac_length, value2._frac_length);
    if (error) { // E_DEC_TRUNCATED
        int32_t to_frac_length = to->_frac_length;
        // ATTN: per the original note the length member is a bit-field, so its
        // address cannot be taken; a local copy is clamped instead.
        set_if_smaller(&to_frac_length, frac0 * DIG_PER_DEC1);
        to->_frac_length = to_frac_length;
        // Shrink the operand word counts to what the result can hold.
        set_if_smaller(&frac1, frac0);
        set_if_smaller(&frac2, frac0);
        set_if_smaller(&intg1, intg0);
        set_if_smaller(&intg2, intg0);
    }

    // part 1 - max(frac) ... min (frac)
    // buf1 walks the operand with the longer fraction, buf2 the other one.
    // stop marks where the two fractions start to overlap; stop2 marks where
    // the shorter integer part ends inside buf1's buffer.
    const int32_t *buf1 = nullptr;
    const int32_t *buf2 = nullptr;
    const int32_t *stop = nullptr;
    const int32_t *stop2 = nullptr;
    if (frac1 > frac2) {
        buf1 = value1._buffer + intg1 + frac1;
        stop = value1._buffer + intg1 + frac2;
        buf2 = value2._buffer + intg2 + frac2;
        stop2 = value1._buffer + ((intg1 > intg2) ? (intg1 - intg2) : 0);
    } else {
        buf1 = value2._buffer + intg2 + frac2;
        stop = value2._buffer + intg2 + frac1;
        buf2 = value1._buffer + intg1 + frac1;
        stop2 = value2._buffer + ((intg2 > intg1) ? (intg2 - intg1) : 0);
    }
    // Fraction words present in only one operand are copied unchanged.
    while (buf1 > stop) {
        *--buf0 = *--buf1;
    }

    // part 2 - min(frac) ... min(intg)
    // Words present in both operands are added with carry propagation.
    int32_t carry = 0;
    while (buf1 > stop2) {
        add(*--buf1, *--buf2, --buf0, &carry);
    }

    // part 3 - min(intg) ... max(intg)
    // Remaining high words of the operand with the longer integer part only
    // need the carry added.
    if (intg1 > intg2) {
        stop = value1._buffer;
        buf1 = stop + intg1 - intg2;
    } else {
        stop = value2._buffer;
        buf1 = stop + intg2 - intg1;
    }
    while (buf1 > stop) {
        add(*--buf1, 0, --buf0, &carry);
    }

    // A final carry goes into the extra leading word.
    if (carry) {
        *--buf0 = 1;
    }

    return error;
}

// Subtracts the digit buffer of value2 from that of value1 (the signs are not
// used to decide which operand is larger) and stores the result in *to.
// The result starts with value1's sign, which is flipped when value2's
// magnitude turns out to be the larger one.
//
// Comparison mode: when to == nullptr nothing is written. The function
// returns 0 if both magnitudes are equal, otherwise 1 when the internal
// "value2 is larger" flag equals value1._sign and -1 when it does not.
//
// @return in subtraction mode E_DEC_OK or the error reported by
//         fix_intg_frac_error() (the code expects only E_DEC_TRUNCATED).
int do_sub(const DecimalValue& value1, const DecimalValue& value2, DecimalValue *to) {
    int32_t intg1 = round_up(value1._int_length);
    int32_t intg2 = round_up(value2._int_length);
    int32_t frac1 = round_up(value1._frac_length);
    int32_t frac2 = round_up(value2._frac_length);
    int32_t frac0 = std::max(frac1, frac2);
    int32_t error = E_DEC_OK;
    int32_t carry = 0;

    // let carry:=1 if value2 > value1
    // TODO(lingbin): add another variable 'is_bigger' to replace 'carry' to make carry only
    //                has one meaning
    const int32_t* buf1 = value1._buffer;
    const int32_t* start1 = buf1;
    const int32_t* stop1 = buf1 + intg1;
    const int32_t* buf2 = value2._buffer;
    const int32_t* start2 = buf2;
    const int32_t* stop2 = buf2 + intg2;
    // ignore leading zeroes
    // start1/start2 and intg1/intg2 afterwards describe the integer part
    // without its leading all-zero words.
    if (*buf1 == 0) {
        while (buf1 < stop1 && *buf1 == 0) {
            buf1++;
        }
        start1 = buf1;
        intg1 = (int32_t) (stop1 - buf1);
    }
    if (*buf2 == 0) {
        while (buf2 < stop2 && *buf2 == 0) {
            buf2++;
        }
        start2 = buf2;
        intg2 = (int32_t) (stop2 - buf2);
    }
    if (intg2 > intg1) {
        // value2 has more significant integer words, so it is larger.
        carry = 1;
    } else if (intg2 == intg1) {
        // Same integer length: compare word by word after trimming
        // trailing zero words.
        const int32_t *end1 = stop1 + (frac1 - 1);
        const int32_t *end2 = stop2 + (frac2 - 1);
        // ignore trailing zeroes
        while ((buf1 <= end1) && (*end1 == 0)) {
            end1--;
        }
        while ((buf2 <= end2) && (*end2 == 0)) {
            end2--;
        }

        frac1 = (int32_t) (end1 - stop1) + 1;
        frac2 = (int32_t) (end2 - stop2) + 1;
        // Skip the common prefix of both numbers.
        while (buf1 <= end1 && buf2 <= end2 && *buf1 == *buf2) {
            buf1++;
            buf2++;
        }

        if (buf1 <= end1) {
            if (buf2 <= end2) { // not equal
                carry = (*buf2 > *buf1);
            } else { // value1 is longer, so value1 > value2
                carry = 0;
            }
        } else {
            if (buf2 <= end2){ // value2 is longer
                carry = 1;
            } else { // short-circuit everything: value1 == value2
                if (to == nullptr) {// for decimal_cmp()
                    return 0;
                }
                to->set_to_zero();
                return E_DEC_OK;
            }
        }
    }

    if (to == nullptr) { // decimal_cmp(), not equal
        return (carry == value1._sign) ? 1 : -1;
    }

    to->_sign = value1._sign;

    // Copies of the operands; below only their _frac_length members are read.
    DecimalValue value_big = value1;
    DecimalValue value_small = value2;

    // ensure that always value1 > value2 (and intg1 >= intg2)
    if (carry) {
        std::swap(value_big, value_small);
        std::swap(start1, start2);
        std::swap(intg1, intg2);
        std::swap(frac1, frac2);
        to->_sign = 1 - to->_sign;
    }

    fix_intg_frac_error(to->_buffer_length, &intg1, &frac0, &error);
    // buf0 is the write cursor; it starts one past the last result word and
    // moves towards to->_buffer.
    int32_t* buf0 = to->_buffer + intg1 + frac0;

    to->_frac_length = std::max(value_big._frac_length, value_small._frac_length);
    to->_int_length = intg1 * DIG_PER_DEC1;
    if (error) { // must be E_DEC_TRUNCATE.
        // The length member is clamped through a local copy (other blocks in
        // this file note that it is a bit-field whose address cannot be taken).
        int32_t temp_to_frac_length = to->_frac_length;
        set_if_smaller(&temp_to_frac_length, frac0 * DIG_PER_DEC1);
        to->_frac_length = temp_to_frac_length;

        set_if_smaller(&frac1, frac0);
        set_if_smaller(&frac2, frac0);
        set_if_smaller(&intg2, intg1);
    }
    // From here on carry is the borrow of the word-wise subtraction.
    carry = 0;

    // part 1 - max(frac) ... min (frac)
    if (frac1 > frac2) {
        buf1 = start1 + intg1 + frac1;
        stop1 = start1 + intg1 + frac2;
        buf2 = start2 + intg2 + frac2;
        while (frac0-- > frac1) { //occur when there are trailing zeroes
            *--buf0 = 0;
        }
        // The minuend has extra fraction words: copy them unchanged.
        while (buf1 > stop1) {
            *--buf0 = *--buf1;
        }
    } else {
        buf1 = start1 + intg1 + frac1;
        buf2 = start2 + intg2 + frac2;
        stop2 = start2 + intg2 + frac1;
        while (frac0-- > frac2) {
            *--buf0 = 0;
        }
        // The subtrahend has extra fraction words: subtract them from 0.
        while (buf2 > stop2) {
            sub(0, *--buf2, --buf0, &carry);
        }
    }

    // part 2 - min(frac) ... intg2
    while (buf2 > start2) {
        sub(*--buf1, *--buf2, --buf0, &carry);
    }

    // part 3 - intg2 ... intg1 */
    // Propagate the borrow through the remaining high words of the minuend...
    while (carry && buf1 > start1) {
        sub(*--buf1, 0, --buf0, &carry);
    }

    // ...and copy whatever is left once no borrow is pending.
    while (buf1 > start1) {
        *--buf0 = *--buf1;
    }

    // Zero any result words in front of the written range.
    while (buf0 > to->_buffer) { // TODO(lingbin): will not happen?
        *--buf0 = 0;
    }

    return error;
}

// Multiplies two decimals: *to = value1 * value2. The result is negative
// exactly when the operand signs differ (a zero result has its sign reset).
//
// @return E_DEC_OK/E_DEC_TRUNCATED/E_DEC_OVERFLOW;
//
// NOTE:
//  The original note for this routine says that a 63-digit number takes only
//  7 buffer words (DIG_PER_DEC1 = 9 decimal digits per word), so a naive
//  O(n*n) schoolbook multiplication over the words is sufficient.
//  XXX if this library is to be used with huge numbers of thousands of
//  digits, fast multiplication must be implemented.
int do_mul(const DecimalValue& value1, const DecimalValue& value2, DecimalValue* to) {
    int32_t intg1 = round_up(value1._int_length);
    int32_t intg2 = round_up(value2._int_length);
    int32_t frac1 = round_up(value1._frac_length);
    int32_t frac2 = round_up(value2._frac_length);
    int32_t intg0 = round_up(value1._int_length + value2._int_length);
    int32_t frac0 = frac1 + frac2;
    int32_t error = E_DEC_OK;

    // buf1/buf2 point at the first fraction word of each operand.
    const int32_t* buf1 = value1._buffer + intg1;
    const int32_t* buf2 = value2._buffer + intg2;

    // If E_DEC_OVERFLOW, save 'ideal' values. Note that no need to calculate fraction now.
    int32_t temp_intg = intg0;
    // if E_DEC_TRUNCATE, use to
    int32_t temp_frac = frac0;
    fix_intg_frac_error(to->_buffer_length, &intg0, &frac0, &error);  // bound size
    to->_sign = (value1._sign != value2._sign) ? true : false;
    to->_int_length = intg0 * DIG_PER_DEC1;
    to->_frac_length = value1._frac_length + value2._frac_length; // store size in digits

    int32_t temp_to_frac_length = to->_frac_length;
    // ATTN: per the original note the length member is a bit-field, so its
    // address cannot be taken; a local copy is clamped instead.
    set_if_smaller(&temp_to_frac_length, NOT_FIXED_DEC);
    to->_frac_length = temp_to_frac_length;
    if (error) {
        int32_t temp_to_int_length = to->_int_length;
        set_if_smaller(&temp_to_int_length, intg0 * DIG_PER_DEC1);
        to->_int_length = temp_to_int_length;

        // Note: this declaration shadows the outer temp_to_frac_length.
        int32_t temp_to_frac_length = to->_frac_length;
        set_if_smaller(&temp_to_frac_length, frac0 * DIG_PER_DEC1);
        to->_frac_length = temp_to_frac_length;

        if (temp_intg > intg0) { // bounded integer-part, E_DEC_OVERFLOW
            // Split the number of integer words that do not fit between the
            // two operands and ignore both fractions.
            temp_intg -= intg0;
            temp_frac = temp_intg >> 1;
            intg1 -= temp_frac;
            intg2 -= temp_intg - temp_frac;
            frac1 = frac2 = 0; // frac0 is already 0 here
        } else { // bounded fract part, E_DEC_TRUNCATE
            // Split the number of fraction words that do not fit between the
            // two operands; the operand with the shorter (or equal) fraction
            // gives up the rounded-down half.
            temp_frac -= frac0;
            temp_intg = temp_frac >> 1;
            if (frac1 <= frac2) {
                frac1 -= temp_intg;
                frac2 -= temp_frac - temp_intg;
            } else {
                frac2 -= temp_intg;
                frac1 -= temp_frac - temp_intg;
            }
        }
    }
    // start0: last (least significant) result word.
    // start2: last word of value2 that takes part in the product.
    // stop1/stop2: first word of each operand that takes part in the product.
    int32_t* start0 = to->_buffer + intg0 + frac0 - 1;
    const int32_t* start2 = buf2 + frac2 - 1;
    const int32_t* stop1 = buf1 - intg1;
    const int32_t* stop2 = buf2 - intg2;
    int32_t* buf0 = nullptr;
    int32_t carry = 0;

    memset(to->_buffer, 0, (intg0 + frac0) * sizeof(int32_t));
    // Schoolbook multiplication: for every word of value1 (least significant
    // first) accumulate its product with every word of value2 into the result.
    for (buf1 += frac1 - 1; buf1 >= stop1; buf1--, start0--) {
        carry = 0;
        for (buf0 = start0, buf2 = start2; buf2 >= stop2; buf2--, buf0--) {
            // 64-bit product split into a high and a low base-DIG_BASE word.
            int64_t mul_result = ((int64_t) *buf1)
                    * ((int64_t) *buf2);
            int32_t high = (int32_t) (mul_result / DIG_BASE);
            int32_t low =
                    (int32_t) (mul_result - ((int64_t)high) * DIG_BASE);
            add2(*buf0, low, buf0, &carry);
            carry += high;
        }
        if (carry) {
            // The carry would have to be stored in front of the buffer.
            if (buf0 < to->_buffer) {
                return E_DEC_OVERFLOW;
            }
            add2(*buf0, 0, buf0, &carry);
        }
        // may carry again.
        for (buf0--; carry; buf0--) {
            if (buf0 < to->_buffer) {
                return E_DEC_OVERFLOW;
            }
            add2(*buf0, 0, buf0, &carry);
        }
    }

    // Now we have to check for '-0.000' case
    if (to->_sign) {
        int32_t *buf = to->_buffer;
        int32_t *end = to->_buffer + intg0 + frac0;
        for (;buf < end; ++buf) {
            if (*buf) {
                break;
            }
        }
        if (buf == end) {
            // We got decimal zero
            to->set_to_zero();
        }
    }

    // remove leading zeros.
    // At least one integer word (DIG_PER_DEC1 digits) is always kept.
    buf1 = to->_buffer;
    int32_t d_to_move = intg0 + round_up(to->_frac_length);
    while ((*buf1 == 0) && (to->_int_length > DIG_PER_DEC1)) {
        ++buf1;
        to->_int_length -= DIG_PER_DEC1;
        d_to_move--;
    }
    if (to->_buffer < buf1) {
        // Shift the remaining words to the front of the buffer.
        int32_t *cur_d = to->_buffer;
        for (; d_to_move--; cur_d++, buf1++) {
            *cur_d = *buf1;
        }
    }

    return error;
}

// Long division of value1 by value2 on the word buffers.
//
// Exactly one of `to` / `mod` is expected to be non-null:
//   - division (N1 / N2): pass `to`, with mod == nullptr;
//   - modulo   (N1 % N2): pass `mod`; `to` is ignored and the remainder is
//                         written to *mod.
//
// @return E_DEC_OK, E_DEC_TRUNCATED, E_DEC_OVERFLOW,
//         E_DEC_DIV_ZERO when value2 is zero (the output is not touched),
//         E_DEC_OOM when the scratch buffer cannot be allocated.
int do_div_mod(
            const DecimalValue& value1,
            const DecimalValue& value2,
            DecimalValue* to,
            DecimalValue* mod) {
    // frac1/frac2 and prec1/prec2 are counted in decimal digits; the fractions
    // are rounded up to whole words first.
    int32_t frac1 = round_up(value1._frac_length) * DIG_PER_DEC1;
    int32_t frac2 = round_up(value2._frac_length) * DIG_PER_DEC1;
    int32_t prec1 = value1._int_length + frac1;
    int32_t prec2 = value2._int_length + frac2;
    int32_t error = E_DEC_OK;

    // From here on `to` is the output object for both modes.
    if (mod) {
        to = mod;
    }

    const int32_t* buff1 = value1._buffer;
    const int32_t* buff2 = value2._buffer;

#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Warray-bounds"
    // removing all the leading zeros
    // process value2
    int32_t first_big_digit_length = (prec2 - 1) % DIG_PER_DEC1 + 1;
    while (prec2 > 0 && *buff2 == 0) {
        prec2 -= first_big_digit_length;
        first_big_digit_length = DIG_PER_DEC1;
        ++buff2;
    }
    if (prec2 <= 0) { // short-circuit everything, value2 == 0
        return E_DEC_DIV_ZERO;
    }
    // Drop the leading zero digits inside the first non-zero word as well.
    first_big_digit_length = (prec2 - 1) % DIG_PER_DEC1 + 1;
    for (; *buff2 < powers10[--first_big_digit_length];) {
        --prec2;
    }

    // process value1
    first_big_digit_length = (prec1 - 1) % DIG_PER_DEC1 + 1;
    while (prec1 > 0 && *buff1 == 0) {
        prec1 -= first_big_digit_length;
        first_big_digit_length = DIG_PER_DEC1;
        ++buff1;
    }
    if (prec1 <= 0) { // short-circuit everything, value1 == 0
        to->set_to_zero();
        return E_DEC_OK;
    }
    first_big_digit_length = (prec1 - 1) % DIG_PER_DEC1 + 1;
    for (; *buff1 < powers10[--first_big_digit_length];) {
        --prec1;
    }
#pragma GCC diagnostic pop

    // Compare the integer parts of both numbers to get the integer length of
    // the result. If the dividend is the smaller one, intg0 = 0.
    int32_t dintg = (prec1 - frac1) - (prec2 - frac2) + (*buff1 >= *buff2);
    int32_t intg0 = 0; // big digit length
    int32_t frac0 = 0;
    if (dintg < 0) {
        dintg /= DIG_PER_DEC1;
        intg0 = 0;
    } else {
        intg0 = round_up(dintg);
    }

    if (mod) {
        // we are calculating N1 % N2. The result will have
        //  1) frac = max(frac1, frac2), as for subtraction
        //  2) intg = intg2.
        to->_sign = value1._sign;
        to->_frac_length = std::max(value1._frac_length, value2._frac_length);
        frac0 = 0;
    } else {
        // we are calculating N1/N2.
        // N1 is in the buff1, has prec1 digits; N2 is in the buff2, has prec2 digits.
        // Scales are frac1 and frac2 accordingly.
        // Thus, the result will have
        //  1) frac = round_up(frac1 + frac2)
        //  2) intg = (prec1 - frac1) - (prec2 - frac2) + 1
        //  3) prec = intg + frac

        frac0 = round_up(frac1 + frac2);
        if (frac0 == 0) {
            frac0 = 1;
        }
        fix_intg_frac_error(to->_buffer_length, &intg0, &frac0, &error);

        to->_sign = (value1._sign != value2._sign);
        to->_int_length = intg0 * DIG_PER_DEC1;
        to->_frac_length = frac0 * DIG_PER_DEC1;
    }

    int32_t* buff0 = to->_buffer;
    int32_t* stop0 = buff0 + intg0 + frac0;
    int32_t div_mod = !(mod); // true when do div, false when do mod.
    if (div_mod) { // do div
        // A negative dintg means the quotient starts with zero words.
        while (dintg++ < 0 && buff0 < &(to->_buffer[to->_buffer_length])) {
            *buff0++ = 0;
        }
    }

    // tmp1 is a zero-extended working copy of the dividend; it is modified in
    // place and ends up holding the remainder.
    int32_t i = round_up(prec1);
    int32_t len1 = i + round_up(2 * frac2 + 1) + 1;
    set_if_bigger(&len1, 3);
    // len1 is already a word count. The previous code multiplied it by
    // sizeof(int32_t) again and so allocated four times the words that the
    // memcpy/memset below and stop1 ever describe.
    int32_t* tmp1 = new (std::nothrow) int32_t[len1];
    if (tmp1 == nullptr) {
        return E_DEC_OOM;
    }
    memcpy(tmp1, buff1, i * sizeof(int32_t));
    memset(tmp1 + i, 0, (len1 - i) * sizeof(int32_t));

    int32_t* start1 = tmp1;
    int32_t* stop1 = start1 + len1;
    const int32_t* start2 = buff2;
    const int32_t* stop2 = buff2 + round_up(prec2) - 1;

    // removing end zeroes
    // The bounds check comes first so *stop2 is never read in front of start2.
    while (stop2 >= start2 && *stop2 == 0) {
        --stop2;
    }
    // len2 = (number of significant divisor words) - 1; stop2 ends up one past
    // the last significant divisor word.
    int32_t len2 = (int32_t)((stop2++) - start2);

    // calculating norm2 (normalized *start2) - we need *start2 to be large
    // (at least > DIG_BASE/2), but unlike Knuth's Alg. D we don't want to
    // normalize input numbers (as we don't make a copy of the divisor).
    // Thus we normalize first big_digit_type of buf2 only, and we'll normalize *start1
    // on the fly for the purpose of guesstimation only.
    // It's also faster, as we're saving on normalization of buf2
    int64_t norm_factor = DIG_BASE / (*start2 + 1);
    int32_t norm2 = (int32_t)(norm_factor * start2[0]);
    if (len2 > 0) {
        norm2 += (int32_t)(norm_factor * start2[1] / DIG_BASE);
    }

    // dcarry is the word carried in front of the current dividend window.
    int32_t dcarry;
    if (*start1 < *start2) {
        dcarry = *start1++;
    } else {
        dcarry = 0;
    }

    int64_t guess = 0;
    // main loop
    // One quotient word is produced per iteration.
    for (; buff0 < stop0; buff0++) {
        // short-circuit, if possible
        if (dcarry == 0 && *start1 < *start2) {
            guess = 0;
        } else {
            // D3: make a guess
            int64_t x = start1[0] + ((int64_t)dcarry) * DIG_BASE;
            int64_t y = start1[1];
            guess = (norm_factor * x + norm_factor * y / DIG_BASE) / norm2;
            if (guess >= DIG_BASE) {
                guess = DIG_BASE - 1;
            }
            if (len2 > 0) {
                // hmm, this is a suspicious trick - I removed normalization here
                if (start2[1] * guess > (x - guess * start2[0]) * DIG_BASE + y) {
                    guess--;
                }
                if (start2[1] * guess > (x - guess * start2[0]) * DIG_BASE + y){
                    guess--;
                }
            }

            // D4: multiply and subtract
            buff2 = stop2;
            int32_t* temp_prt = start1 + len2;
            int32_t carry = 0;
            for (; buff2 > start2; --temp_prt) {
                int32_t high;
                int32_t low;
                x = guess * (*--buff2);
                high = (int32_t)(x / DIG_BASE);
                low = (int32_t)(x - ((int64_t)high) * DIG_BASE);
                sub2(*temp_prt, low, temp_prt, &carry);
                carry += high;
            }
            carry = dcarry < carry;

            // D5: check the remainder
            if (carry) {
                // D6: correct the guess
                // The guess was one too large: add the divisor back once.
                guess--;
                buff2 = stop2;
                temp_prt = start1 + len2;
                for (carry = 0; buff2 > start2; temp_prt--) {
                    add(*temp_prt, *--buff2, temp_prt, &carry);
                }
            }
        }
        if (div_mod) {
            *buff0 = (int32_t)guess;
        }
        dcarry = *start1;
        ++start1;
    }

    // do { ... } while (0) lets the modulo branch `break` to the common
    // clean-up code below.
    do{
        if (mod) {
        // now the result is in tmp1, it has
        //  intg=prec1-frac1
        //  frac=max(frac1, frac2)=to->frac
            if (dcarry) {
                *--start1 = dcarry;
            }
            buff0 = to->_buffer;
            intg0 = (int) (round_up(prec1 - frac1) - (start1 - tmp1));
            frac0 = round_up(to->_frac_length);
            error = E_DEC_OK;
            if (frac0 == 0 && intg0 == 0) {
                to->set_to_zero();
                break;
            }
            if (intg0 <= 0) {
                // The remainder has no integer words; -intg0 leading fraction
                // words are zero.
                if (-intg0 >= to->_buffer_length) {
                    error = E_DEC_TRUNCATED;
                    to->set_to_zero();
                    break;
                }
                stop1 = start1 + frac0 + intg0;
                frac0 += intg0;
                to->_int_length = 0;
                while (intg0++ < 0) {
                    *buff0++ = 0;
                }
            } else {
                if (intg0 > to->_buffer_length) {
                    frac0 = 0;
                    intg0 = to->_buffer_length;
                    error = E_DEC_OVERFLOW;
                    break;
                }
                stop1 = start1 + frac0 + intg0;
                to->_int_length = std::min(intg0 * DIG_PER_DEC1, (int) value2._int_length);
            }
            if (intg0 + frac0 > to->_buffer_length) {
                // Drop the fraction words that do not fit.
                stop1 -= frac0 + intg0 - to->_buffer_length;
                frac0 = to->_buffer_length - intg0;
                to->_frac_length = frac0 * DIG_PER_DEC1;
                error = E_DEC_TRUNCATED;
            }
            while (start1 < stop1) {
                *buff0++ = *start1++;
            }
        }
    }while(0);

    delete[] tmp1;
    // Strip leading zero words from the result and move it to the buffer start.
    int32_t to_int_length = 0;
    const int32_t* first_no_zero = to->get_first_no_zero_index(&to_int_length);
    to->_int_length = to_int_length;
    if (to->_buffer != first_no_zero) {
        memmove(to->_buffer, first_no_zero,
            (round_up(to->_int_length) + round_up(to->_frac_length)) * sizeof(int32_t));
    }
    return error;
}

// Signed addition. Operands with equal signs have their magnitudes added;
// otherwise the magnitude of v2 is subtracted from that of v1.
// TODO(lingbin): the error code returned by do_add()/do_sub() is ignored.
DecimalValue operator+(const DecimalValue& v1, const DecimalValue& v2) {
    DecimalValue sum;
    const bool same_sign = (v1._sign == v2._sign);
    if (!same_sign) {
        do_sub(v1, v2, &sum);
        return sum;
    }
    do_add(v1, v2, &sum);
    return sum;
}

// Signed subtraction. Operands with equal signs have their magnitudes
// subtracted; otherwise the magnitudes are added. The error code of the
// helper is ignored.
DecimalValue operator-(const DecimalValue& v1, const DecimalValue& v2) {
    DecimalValue difference;
    const bool same_sign = (v1._sign == v2._sign);
    if (!same_sign) {
        do_add(v1, v2, &difference);
        return difference;
    }
    do_sub(v1, v2, &difference);
    return difference;
}

// Product of two decimals; the error code of do_mul() is ignored.
DecimalValue operator*(const DecimalValue& v1, const DecimalValue& v2){
    DecimalValue product;
    DecimalValue* const out = &product;
    do_mul(v1, v2, out);
    return product;
}

// Quotient v1 / v2. The error code of do_div_mod() (including division by
// zero) is ignored; the returned object is whatever do_div_mod() left in it.
DecimalValue operator/(const DecimalValue& v1, const DecimalValue& v2){
    DecimalValue quotient;
    DecimalValue* const no_remainder = nullptr;
    do_div_mod(v1, v2, &quotient, no_remainder);
    return quotient;
}

// Remainder v1 % v2. The error code of do_div_mod() (including division by
// zero) is ignored; the returned object is whatever do_div_mod() left in it.
DecimalValue operator%(const DecimalValue& v1, const DecimalValue& v2){
    DecimalValue remainder;
    DecimalValue* const no_quotient = nullptr;
    do_div_mod(v1, v2, no_quotient, &remainder);
    return remainder;
}

// Streams the textual form produced by DecimalValue::to_string().
std::ostream& operator<<(std::ostream& os, DecimalValue const& decimal_value) {
    os << decimal_value.to_string();
    return os;
}

// Reads one whitespace-delimited token from the stream and parses it into
// decimal_value. The result code of parse_from_str() is not reported.
std::istream& operator>>(std::istream& ism, DecimalValue& decimal_value) {
    std::string token;
    ism >> token;
    const char* text = token.c_str();
    decimal_value.parse_from_str(text, token.size());
    return ism;
}

// Unary minus: returns a copy of v with the sign flag inverted.
DecimalValue operator-(const DecimalValue& v) {
    DecimalValue negated = v;
    negated._sign = negated._sign ? false : true;
    return negated;
}

// In-place addition, implemented through the binary operator+.
DecimalValue& DecimalValue::operator+=(const DecimalValue& other) {
    const DecimalValue& self = *this;
    *this = self + other;
    return *this;
}

// Parses the first `length` characters of decimal_str into this value.
//
// Accepted form: optional leading whitespace, an optional '+' or '-', decimal
// digits, and optionally '.' followed by more digits. Characters after the
// number are ignored unless they start an exponent ('e' / 'E').
//
// @param decimal_str text to parse; it does not have to be NUL-terminated
// @param length      number of characters of decimal_str that may be read
// @return E_DEC_OK on success;
//         E_DEC_BAD_NUM when no digit is found (the value is set to zero);
//         E_DEC_TRUNCATED when fraction digits were dropped to fit the buffer;
//         E_DEC_OVERFLOW when integer digits were dropped to fit the buffer.
//         Scientific notation is not supported: see the exponent handling at
//         the end of the function for the codes returned in that case.
int DecimalValue::parse_from_str(const char* decimal_str, int32_t length) {
    set_to_zero();
    const char* begin = decimal_str;
    const char* end = decimal_str + length;
    int32_t error = E_DEC_OK;

    // ignore leading spaces
    // The <cctype> classifiers are undefined for negative char values, so the
    // character is converted to unsigned char first.
    while (begin < end && std::isspace(static_cast<unsigned char>(*begin))) {
        ++begin;
    }
    if (begin == end) {
        set_to_zero();
        return E_DEC_BAD_NUM;
    }

    // positive or negative
    if (*begin == '-') {
        _sign = true;
        ++begin;
    } else if (*begin == '+') {
        _sign = false;
        ++begin;
    } else {
        _sign = false;
    }

    // count int_length and frac_length
    const char* temp_ptr = begin;
    const char* frac_ptr = nullptr;
    // after this loop, 'begin' point to the first non digital position
    while (begin < end && std::isdigit(static_cast<unsigned char>(*begin))) {
        ++begin;
    }
    int32_t int_len = (int32_t) (begin - temp_ptr);
    int32_t frac_len = 0;
    if (begin < end && *begin == '.') {
        // frac_ptr ends up one past the last fraction digit.
        frac_ptr = begin + 1;
        while (frac_ptr < end && std::isdigit(static_cast<unsigned char>(*frac_ptr))) {
            ++frac_ptr;
        }
        frac_len = frac_ptr - begin - 1;  // -1 for char '.'
    } else {
        frac_len = 0;
        frac_ptr = begin;
    }

    // bad num like "  a"
    if ((int_len + frac_len) == 0) {
        set_to_zero();
        return E_DEC_BAD_NUM;
    }

    // Fit the number into the buffer; on truncation/overflow only the digits
    // that fit are stored.
    int32_t int_big_digit_len = round_up(int_len);
    int32_t frac_big_digit_len = round_up(frac_len);
    fix_intg_frac_error(_buffer_length, &int_big_digit_len, &frac_big_digit_len, &error);
    if (error) {
        frac_len = frac_big_digit_len * DIG_PER_DEC1;
        if (error == E_DEC_OVERFLOW) {
            int_len = int_big_digit_len * DIG_PER_DEC1;
        }
    }

    _int_length = int_len;
    _frac_length = frac_len;
    temp_ptr = begin;

    // fill int value
    // Digits are consumed right to left, starting just before the position
    // where the integer digits ended, DIG_PER_DEC1 digits per buffer word.
    int32_t* buff = _buffer + int_big_digit_len;
    int32_t value = 0;
    int32_t index_in_powers10 = 0;
    for (; int_len > 0; --int_len) {
        value += (*--temp_ptr - '0') * powers10[index_in_powers10];
        ++index_in_powers10;
        if (index_in_powers10 == DIG_PER_DEC1) {
            *--buff = value;
            value = 0;
            index_in_powers10 = 0;
        }
    }
    if (index_in_powers10) {
        *--buff = value;
    }

    // fill fraction value
    // 'begin' points at the '.', so pre-increment moves onto the next digit.
    buff = _buffer + int_big_digit_len;
    temp_ptr = begin;
    for (value = 0, index_in_powers10 = 0; frac_len > 0; --frac_len) {
        value = (*++temp_ptr - '0') + value * 10;
        ++index_in_powers10;
        if (index_in_powers10 == DIG_PER_DEC1) {
            *buff++ = value;
            value = 0;
            index_in_powers10 = 0;
        }
    }
    if (index_in_powers10) {
        // A partially filled last word is padded with zero digits on the right.
        *buff = value * powers10[DIG_PER_DEC1 - index_in_powers10];
    }

    // TODO: we do not support decimal in scientific notation
    if ((frac_ptr + 1) < end && (*frac_ptr == 'e' || *frac_ptr == 'E')) {
        // The input is only guaranteed to be readable up to `end`, while
        // strtoll() scans until it meets a non-numeric character. Parse a
        // NUL-terminated copy of the remaining text so no byte beyond `end`
        // is read.
        const std::string exponent_text(frac_ptr + 1, end);
        char* exponent_end = nullptr;
        // strtoll() reports range errors only through errno; clear it so a
        // stale value from an earlier call is not mistaken for a failure.
        errno = 0;
        int64_t exponent = strtoll(exponent_text.c_str(), &exponent_end, 10);
        if (exponent_end != exponent_text.c_str()) { // If at least one digit
            if (errno) { // system error number, it is thread local
                set_to_zero();
                return E_DEC_BAD_NUM;
            }
            if (exponent > (INT_MAX / 2) || (errno == 0 && exponent < 0)) {
                set_to_zero();
                return E_DEC_OVERFLOW;
            }
            if (exponent < INT_MAX / 2 && error != E_DEC_OVERFLOW) {
                set_to_zero();
                return E_DEC_TRUNCATED;
            }
            // NOTE(review): applying the exponent is not implemented:
            //   error = shift((int32_t) exponent);
            // With the checks above, every exponent ends in an error return
            // unless the mantissa already overflowed or the exponent is
            // exactly INT_MAX / 2.
        }
    }
    // Never produce a negative zero.
    if (_sign && is_zero()) {
        _sign = false;
    }
    return error;
}

// Formats the value without trailing fraction zeroes: the scale passed to
// to_string(int) is the number of fraction digits left after dropping
// trailing zero words and the trailing zero digits of the last kept word.
// TODO(lingbin): should be refactored with to_string(int scale)
std::string DecimalValue::to_string() const {
    const int32_t intg = round_up(_int_length);
    const int32_t* frac_begin = _buffer + intg;

    // Ignore trailing zero words. The previous loop compared the cursor
    // against its own start position, so it never ran and all-zero trailing
    // fraction words were never dropped.
    int32_t actual_frac = round_up(_frac_length);
    while ((actual_frac > 0) && (frac_begin[actual_frac - 1] == 0)) {
        --actual_frac;
    }

    int32_t actual_frac_len = actual_frac * DIG_PER_DEC1;

    // Count the number of zeroes at the end of last "big digit" number
    if (actual_frac_len > 0) {
        int32_t last_big_digit = frac_begin[actual_frac - 1];
        while ((last_big_digit > 0) && (last_big_digit % 10) == 0) {
            --actual_frac_len;
            last_big_digit /= 10;
        }
    }

    return to_string(actual_frac_len);
}

// Formats the value as [-]<integer digits>[.<fraction digits>].
//
// At most `scale` fraction digits are written; digits beyond `scale` are cut
// off without rounding. A fraction shorter than `scale` is NOT padded with
// zeroes: the returned string only ever contains min(_frac_length, scale)
// fraction digits. (The previous zero-fill loop stored '0' into the first
// integer position, which is always overwritten below, and the padding was
// never counted in `length`; that dead loop has been removed.)
//
// @param scale maximum number of fraction digits to print
std::string DecimalValue::to_string(int scale) const {
    int32_t temp_intg = _int_length;
    int32_t temp_frac = _frac_length;
    if (temp_frac > scale) {
        temp_frac = scale;
    }
    // get_first_no_zero_index() also updates temp_intg; it is used below as
    // the number of integer digits that start at buff_no_zero.
    const int32_t* buff_no_zero = get_first_no_zero_index(&temp_intg);

    // Nothing to print at all: print a single "0" taken from a local word.
    int32_t temp = 0;
    if ((temp_intg + temp_frac) == 0) {
        temp_intg = 1;
        buff_no_zero = &temp;
    }

    // A value without integer digits is still printed with a leading '0'.
    int32_t int_str_length = temp_intg;
    if (temp_intg == 0) {
        int_str_length = 1;
    }
    int32_t length = (_sign ? 1 : 0)
        + int_str_length + (temp_frac ? 1 : 0) + temp_frac;

    char result_str[DECIMAL_MAX_STR_LENGTH + 1];
    char* result_ptr = result_str;

    result_ptr[length] = '\0';
    if (_sign) {
        *result_ptr++ = '-';
    }
    if (temp_frac) {
        // Fraction: written left to right behind the integer digits.
        char* char_point = result_ptr + int_str_length;
        const int32_t* buff = buff_no_zero + round_up(temp_intg);
        *char_point++ = '.';
        for (; temp_frac > 0; temp_frac -= DIG_PER_DEC1) {
            int32_t m = *buff++;
            // Peel digits off the word from the most significant side.
            for (int32_t i = std::min(temp_frac, DIG_PER_DEC1); i; --i) {
                int32_t n = m / DIG_MASK;
                *char_point++ = '0' + n;
                m -= n * DIG_MASK;
                m *= 10;
            }
        }
    }

    if (temp_intg) {
        // Integer part: written right to left, least significant word first.
        char* char_point = result_ptr + int_str_length;
        const int32_t* buff = buff_no_zero + round_up(temp_intg);
        for (; temp_intg > 0; temp_intg -= DIG_PER_DEC1) {
            int32_t m = *--buff;
            for (int32_t i = std::min(temp_intg, DIG_PER_DEC1); i; --i) {
                int32_t n = m / 10;
                *--char_point = '0' + (m - n * 10);
                m = n;
            }
        }
    } else {
        *result_ptr = '0';
    }

    return std::string(result_str, length);
}

// Overwrite this value's digits with the maximum for the given layout:
// `precision` total digits, of which `frac` are after the decimal point
// (presumably every digit becomes 9 -- see powers10 / DIG_MAX / frac_max).
// NOTE: only the absolute value is rewritten; _sign is left untouched.
void DecimalValue::to_max_decimal(int32_t precision, int32_t frac) {
    int32_t* cursor = _buffer;

    // Integer part: an optional partial leading word, then the full words.
    const int32_t int_digits = precision - frac;
    _int_length = int_digits;
    if (int_digits != 0) {
        const int32_t leading_digits = int_digits % DIG_PER_DEC1;
        if (leading_digits != 0) {
            *cursor = powers10[leading_digits] - 1; // 9, 99, 999, ...
            ++cursor;
        }
        int32_t full_words = int_digits / DIG_PER_DEC1;
        while (full_words != 0) {
            *cursor = DIG_MAX;
            ++cursor;
            --full_words;
        }
    }

    // Fractional part: the full words first, then an optional partial
    // trailing word taken from the frac_max table.
    _frac_length = frac;
    if (frac != 0) {
        const int32_t trailing_digits = frac % DIG_PER_DEC1;
        int32_t full_words = frac / DIG_PER_DEC1;
        while (full_words != 0) {
            *cursor = DIG_MAX;
            ++cursor;
            --full_words;
        }
        if (trailing_digits != 0) {
            *cursor = frac_max[trailing_digits - 1];
        }
    }
}

// Free-function hash for DecimalValue: forwards to DecimalValue::hash(),
// passing 0 as its argument, and returns the result as std::size_t.
// NOTE(review): presumably the hook picked up by generic hashing code
// (e.g. boost::hash via ADL) -- confirm against callers.
std::size_t hash_value(DecimalValue const& value) {
    const std::size_t digest = value.hash(0);
    return digest;
}

// Round this value to `scale` fractional digits and store the result in `to`.
//
// @param to     destination; may be `this`, in which case the copy step is
//               skipped and the value is rounded in place.
// @param scale  number of fractional digits to keep. Negative values are
//               accepted: the result is zero when scale + _int_length < 0, and
//               the stored _frac_length is never negative.
// @param mode   HALF_UP, HALF_EVEN, CEILING, FLOOR or TRUNCATE.
// @return       E_DEC_OK on success (including when the result is zero),
//               E_DEC_TRUNCATED when `scale` had to be reduced to fit the
//               buffer, E_DEC_OVERFLOW when a carry out of the top word does
//               not fit, E_DEC_ERROR for an unrecognised `mode`.
//
// Naming used below (round_up() appears to convert a digit count into a count
// of buffer words -- confirm against its definition):
//   frac0 - words needed for the requested scale
//   frac1 - words currently used by the fractional part
//   intg0 - words currently used by the integer part
int DecimalValue::round(DecimalValue *to, int scale, DecimalRoundMode mode) {
    int frac0 = scale > 0 ? round_up(scale) : (scale + 1) / DIG_PER_DEC1;
    int frac1 = round_up(_frac_length);
    int intg0 = round_up(_int_length);
    int error = E_DEC_OK;
    int len = _buffer_length;

    int32_t* buf0 = _buffer;
    int32_t* buf1 = to->_buffer;
    int32_t x = 0;
    int32_t y = 0;
    int32_t carry = 0;
    int first_dig = 0;

    // round_digit is the threshold the first discarded digit is compared to:
    //   5  -> round half (tie handling depends on HALF_UP vs HALF_EVEN)
    //   0  -> round away from zero whenever anything non-zero is discarded
    //   10 -> never round up (a single digit is never > 10)
    // CEILING and FLOOR pick 0 or 10 depending on the sign.
    int round_digit = 0;
    switch (mode) {
    case HALF_UP:
    case HALF_EVEN:
        round_digit = 5;
        break;
    case CEILING:
        round_digit = _sign ? 10 : 0;
        break;
    case FLOOR:
        round_digit = _sign ? 0 : 10;
        break;
    case TRUNCATE:
        round_digit = 10;
        break;
    default:
        return E_DEC_ERROR;
    }

    // Requested scale does not fit in the buffer: shrink it to what fits and
    // remember that the result is truncated.
    if (frac0 + intg0 > len) {
        frac0 = len - intg0;
        scale = frac0 * DIG_PER_DEC1;
        error = E_DEC_TRUNCATED;
    }
    // Rounding position is left of every integer digit: the result is zero.
    if (scale + _int_length < 0) {
        to->set_to_zero();
        return E_DEC_OK;
    }
    // Rounding into a different object: copy the used words (back to front),
    // then continue working on `to` only.
    if (to != this) {
        int32_t *p0 = buf0 + intg0 + std::max(frac1, frac0);
        int32_t *p1 = buf1 + intg0 + std::max(frac1, frac0);

        while (buf0 < p0) {
            *(--p1) = *(--p0);
        }

        buf0 = to->_buffer;
        buf1 = to->_buffer;
        to->_sign = _sign;
        to->_int_length = std::min(intg0, len) * DIG_PER_DEC1;
    }
    // More fractional words requested than stored: nothing to truncate, just
    // zero-fill the extra words.
    if (frac0 > frac1) {
        buf1 += intg0 + frac1;
        while (frac0-- > frac1) {
            *buf1++ = 0;
        }
        to->_frac_length = scale;
        return error;
    }
    // Requested scale is not smaller than the stored one: no digit is dropped.
    if (scale >= _frac_length) {
        /* nothing to do */
        to->_frac_length = scale;
        return error;
    }

    // Point both cursors at the last word that is kept.
    buf0 += intg0 + frac0 - 1;
    buf1 += intg0 + frac0 - 1;
    if (scale == frac0 * DIG_PER_DEC1) {
        // The cut falls exactly on a word boundary: decide from the discarded
        // words whether the last kept word must be incremented.
        bool do_inc = false;
        switch (round_digit) {
        case 0: {
            // Increment if any discarded word is non-zero.
            int32_t* p0 = buf0 + (frac1 - frac0);
            for (; p0 > buf0; p0--) {
                if (*p0) {
                    do_inc = true;
                    break;
                }
            }
            break;
        }
        case 5: {
            // x is taken from the top of the first discarded word; on a tie
            // HALF_UP always increments, otherwise only when the kept word is
            // odd.
            x = buf0[1] / DIG_MASK;
            do_inc = (x > 5)
                || ((x == 5) && (mode == HALF_UP || (frac0 + intg0 > 0 && *buf0 & 1)));
            break;
        }
        default:
            break;
        }
        if (do_inc) {
            if (frac0 + intg0 > 0) {
                (*buf1)++;
            } else {
                // No kept word exists; store DIG_BASE in the next word so the
                // carry handling below fires.
                *(++buf1) = DIG_BASE;
            }
        } else if (frac0 + intg0 == 0) {
            to->set_to_zero();
            return E_DEC_OK;
        }
    } else {
        // The cut falls inside a word: `pos` is the position of the first
        // discarded digit within that word, y is that digit.
        /* TODO - fix this code as it won't work for CEILING mode */
        int pos = frac0 * DIG_PER_DEC1 - scale - 1;
        x = *buf1 / powers10[pos];
        y = x % 10;
        if (y > round_digit
                || (round_digit == 5 && y == 5 && (mode == HALF_UP || (x / 10) & 1))) {
            x += 10;
        }
        *buf1 = powers10[pos] * (x - y);
    }
    /*
       In case we're rounding e.g. 1.5e9 to 2.0e9, the decimal_digit_t's inside
       the buffer are as follows.

       Before <1, 5e8>
       After  <2, 5e8>

       Hence we need to set the 2nd field to 0.
       The same holds if we round 1.5e-9 to 2e-9.
       */
    if (frac0 < frac1) {
        int32_t *buf = to->_buffer + ((scale == 0 && intg0 == 0) ? 1 : intg0 + frac0);
        int32_t *end = to->_buffer + len;
        while (buf < end) {
            *buf++ = 0;
        }
    }
    if (*buf1 >= DIG_BASE) {
        // The increment overflowed the word: propagate the carry towards the
        // most significant word.
        carry = 1;
        *buf1 -= DIG_BASE;
        while (carry && --buf1 >= to->_buffer) {
            add(0, *buf1, buf1, &carry);
        }
        if (carry) {
            /* shifting the number to create space for new digit */
            if (frac0 + intg0 >= len) {
                frac0--;
                scale = frac0 * DIG_PER_DEC1;
                error = E_DEC_TRUNCATED; /* XXX */
            }
            for (buf1 = to->_buffer + intg0 + std::max(frac0, 0); buf1 > to->_buffer; buf1--) {
                /* Avoid out-of-bounds write. */
                if (buf1 < to->_buffer + len) {
                    buf1[0] = buf1[-1];
                } else {
                    error = E_DEC_OVERFLOW;
                }
            }
            // The carried-out 1 becomes the new most significant word.
            *buf1 = 1;
            /* We cannot have more than 9 * 9 = 81 digits. */
            if (to->_int_length < len * DIG_PER_DEC1) {
                to->_int_length++;
            } else {
                error = E_DEC_OVERFLOW;
            }
        }
    } else {
        // No carry: walk towards the most significant word looking for a
        // non-zero word; if none exists the result is zero.
        for (;;) {
            if (*buf1) {
                break;
            }
            if (buf1-- == to->_buffer) {
                /* making 'zero' with the proper scale */
                int32_t *p0 = to->_buffer + frac0 + 1;
                to->_int_length = 1;
                to->_frac_length = std::max(scale, 0);
                to->_sign = 0;
                for (buf1 = to->_buffer; buf1 < p0; buf1++) {
                    *buf1 = 0;
                }
                return E_DEC_OK;
            }
        }
    }

    /* Here we  check 999.9 -> 1000 case when we need to increase intg */
    first_dig = to->_int_length % DIG_PER_DEC1;
    if (first_dig && (*buf1 >= powers10[first_dig])) {
        to->_int_length++;
    }

    // A negative scale only affects where rounding happens; the stored number
    // of fractional digits is never negative.
    if (scale < 0) {
        scale = 0;
    }

    to->_frac_length = scale;
    return error;
}

} // end namespace doris