add countDigits() function

2024-11-21 15:12:02 +00:00 · 2020-08-27 16:17:13 +03:00 · 2020-08-27 16:17:13 +03:00 · 2a0b98b19c
commit 2a0b98b19c
parent 724b38adc9
6 changed files with 204 additions and 35 deletions
--- a/src/Functions/countDigits.cpp
+++ b/src/Functions/countDigits.cpp
@ -0,0 +1,155 @@
 #include <Functions/IFunctionImpl.h>
 #include <Functions/FunctionFactory.h>
 #include <Functions/FunctionHelpers.h>
 #include <DataTypes/DataTypesNumber.h>
 #include <DataTypes/DataTypesDecimal.h>
 #include <Columns/ColumnsNumber.h>
 #include <Columns/ColumnDecimal.h>
 #include <Columns/ColumnConst.h>
 namespace DB
 {
 /// Error codes referenced by this file. They are only declared here (`extern`);
 /// the definitions live outside this translation unit.
 namespace ErrorCodes
 {
    extern const int ILLEGAL_TYPE_OF_ARGUMENT;
    extern const int ILLEGAL_COLUMN;
 }
 /// Returns the number of decimal digits needed to represent the argument.
 /// Accepts signed and unsigned integers and Decimal values. For a Decimal the digits of the
 /// underlying integer are counted, so the scale is included: toDecimal32(4.2, 1) has 2 digits.
 /// The sign is not counted and zero has 0 digits.
 class FunctionCountDigits : public IFunction
 {
 public:
    static constexpr auto name = "countDigits";
    static FunctionPtr create(const Context &)
    {
        return std::make_shared<FunctionCountDigits>();
    }
    String getName() const override { return name; }
    bool useDefaultImplementationForNulls() const override { return false; }
    size_t getNumberOfArguments() const override { return 1; }
    /// Validates the single argument (integer or Decimal) and reports UInt8 as the result type.
    /// Throws ILLEGAL_TYPE_OF_ARGUMENT for any other argument type.
    DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
    {
        WhichDataType which_first(arguments[0]->getTypeId());
        if (!which_first.isInt() && !which_first.isUInt() && !which_first.isDecimal())
            throw Exception("Illegal type " + arguments[0]->getName() + " of argument of function " + getName(),
                            ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
        return std::make_shared<DataTypeUInt8>(); /// Up to 255 decimal digits.
    }
    /// Computes the digit count for every row of the argument column and stores the resulting
    /// ColumnUInt8 at `result_pos`. Throws ILLEGAL_COLUMN if the argument column is missing or
    /// its concrete column class does not match its declared type.
    void executeImpl(Block & block, const ColumnNumbers & arguments, size_t result_pos, size_t input_rows_count) const override
    {
        const auto & src_column = block.getByPosition(arguments[0]);
        if (!src_column.column)
            throw Exception("Illegal column while execute function " + getName(), ErrorCodes::ILLEGAL_COLUMN);
        auto result_column = ColumnUInt8::create();
        /// Invoked by callOnBasicType with a type pair; RightType is the argument's value type.
        auto call = [&](const auto & types) -> bool
        {
            using Types = std::decay_t<decltype(types)>;
            using Type = typename Types::RightType;
            using ColVecType = std::conditional_t<IsDecimalNumber<Type>, ColumnDecimal<Type>, ColumnVector<Type>>;
            /// Constant argument: count the digits once and replicate the answer for all rows.
            if (const ColumnConst * const_column = checkAndGetColumnConst<ColVecType>(src_column.column.get()))
            {
                Type const_value = checkAndGetColumn<ColVecType>(const_column->getDataColumnPtr().get())->getData()[0];
                UInt32 num_digits = 0;
                if constexpr (IsDecimalNumber<Type>)
                    num_digits = digits(const_value.value);
                else
                    num_digits = digits(const_value);
                result_column->getData().resize_fill(input_rows_count, num_digits);
                return true;
            }
            /// Full column: count digits row by row.
            if (const ColVecType * col_vec = checkAndGetColumn<ColVecType>(src_column.column.get()))
            {
                execute<Type>(*col_vec, *result_column, input_rows_count);
                return true;
            }
            /// The column class does not correspond to the declared type.
            throw Exception("Illegal column while execute function " + getName(), ErrorCodes::ILLEGAL_COLUMN);
        };
        TypeIndex dec_type_idx = src_column.type->getTypeId();
        if (!callOnBasicType<void, true, false, true, false>(dec_type_idx, call))
            throw Exception("Wrong call for " + getName() + " with " + src_column.type->getName(),
                            ErrorCodes::ILLEGAL_COLUMN);
        block.getByPosition(result_pos).column = std::move(result_column);
    }
 private:
    /// Fills `result_column` with the digit count of each of the first `rows_count` values of `col`.
    /// For Decimal columns the underlying integer (`.value`) is used.
    template <typename T, typename ColVecType>
    static void execute(const ColVecType & col, ColumnUInt8 & result_column, size_t rows_count)
    {
        using NativeT = typename NativeType<T>::Type;
        const auto & src_data = col.getData();
        auto & dst_data = result_column.getData();
        dst_data.resize(rows_count);
        for (size_t i = 0; i < rows_count; ++i)
        {
            if constexpr (IsDecimalNumber<T>)
                dst_data[i] = digits<NativeT>(src_data[i].value);
            else
                dst_data[i] = digits<NativeT>(src_data[i]);
        }
    }
    /// Counts the decimal digits of an integer; returns 0 for zero and ignores the sign.
    /// Digits are stripped in chunks of 9 (only for types wider than 32 bits), then 3, then 1,
    /// which keeps the number of divisions small for wide types.
    template <typename T>
    static UInt32 digits(T value)
    {
        static_assert(!IsDecimalNumber<T>);
        /// The divisor has the same signedness as T so the division never mixes signed and unsigned operands.
        using DivT = std::conditional_t<is_signed_v<T>, Int32, UInt32>;
        UInt32 res = 0;
        T tmp;
        if constexpr (sizeof(T) > sizeof(Int32))
        {
            static constexpr const DivT e9 = 1000000000;
            tmp = value / e9;
            /// `value` always holds the last non-zero quotient, so the remaining leading digits
            /// are still available to the finer-grained loops below.
            while (tmp != 0)
            {
                value = tmp;
                tmp /= e9;
                res += 9;
            }
        }
        static constexpr const DivT e3 = 1000;
        tmp = value / e3;
        while (tmp != 0)
        {
            value = tmp;
            tmp /= e3;
            res += 3;
        }
        /// Fewer than 4 digits remain; count them one at a time.
        while (value != 0)
        {
            value /= 10;
            ++res;
        }
        return res;
    }
 };
 /// Registers FunctionCountDigits in the given function factory.
 void registerFunctionCountDigits(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionCountDigits>();
 }
 }
--- a/src/Functions/isDecimalOverflow.cpp
+++ b/src/Functions/isDecimalOverflow.cpp
@ -6,6 +6,7 @@
 #include <Columns/ColumnsNumber.h>
 #include <Columns/ColumnDecimal.h>
 #include <Columns/ColumnConst.h>
 #include <Common/intExp.h>
 namespace DB
@ -37,7 +38,7 @@ public:
    DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
    {
-        if (arguments.size() < 1 || arguments.size() > 2)
+        if (arguments.empty() || arguments.size() > 2)
            throw Exception("Number of arguments for function " + getName() + " doesn't match: passed " +
                toString(arguments.size()) + ", should be 1 or 2.", ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH);
@ -87,13 +88,12 @@ public:
        {
            using Types = std::decay_t<decltype(types)>;
            using Type = typename Types::RightType;
            using NativeT = typename Type::NativeType;
            using ColVecType = ColumnDecimal<Type>;
            if (const ColumnConst * const_column = checkAndGetColumnConst<ColVecType>(src_column.column.get()))
            {
                Type const_decimal = checkAndGetColumn<ColVecType>(const_column->getDataColumnPtr().get())->getData()[0];
-                UInt8 res_value = (digits<NativeT>(const_decimal.value) > precision);
+                UInt8 res_value = outOfDigits<Type>(const_decimal, precision);
                result_column->getData().resize_fill(input_rows_count, res_value);
                return true;
            }
@ -118,50 +118,28 @@ private:
    template <typename T>
    static void execute(const ColumnDecimal<T> & col, ColumnUInt8 & result_column, size_t rows_count, UInt32 precision)
    {
        using NativeT = typename T::NativeType;
        const auto & src_data = col.getData();
        auto & dst_data = result_column.getData();
        dst_data.resize(rows_count);
        for (size_t i = 0; i < rows_count; ++i)
-            dst_data[i] = (digits<NativeT>(src_data[i].value) > precision);
+            dst_data[i] = outOfDigits<T>(src_data[i], precision);
    }
    template <typename T>
-    static UInt32 digits(T value)
+    static bool outOfDigits(T dec, UInt32 precision)
    {
-        UInt32 res = 0;
+        static_assert(IsDecimalNumber<T>);
-        T tmp;
+        using NativeT = typename T::NativeType;
-        static constexpr const Int32 e3 = 1000;
+        if (precision > DecimalUtils::maxPrecision<T>())
-        static constexpr const Int32 e9 = 1000000000;
+            return false;
-        if constexpr (sizeof(T) > sizeof(Int32))
+        NativeT pow10 = intExp10OfSize<NativeT>(precision);
        {
            tmp = value / e9;
            while (tmp)
            {
                value = tmp;
                tmp /= e9;
                res += 9;
            }
        }
-        tmp = value / e3;
+        if (dec.value < 0)
-        while (tmp)
+            return dec.value <= -pow10;
-        {
+        return dec.value >= pow10;
            value = tmp;
            tmp /= e3;
            res += 3;
        }
        while (value)
        {
            value /= 10;
            ++res;
        }
        return res;
    }
 };
--- a/src/Functions/registerFunctionsMiscellaneous.cpp
+++ b/src/Functions/registerFunctionsMiscellaneous.cpp
@ -60,6 +60,7 @@ void registerFunctionGetScalar(FunctionFactory &);
 void registerFunctionGetSetting(FunctionFactory &);
 void registerFunctionIsConstant(FunctionFactory &);
 void registerFunctionIsDecimalOverflow(FunctionFactory &);
 void registerFunctionCountDigits(FunctionFactory &);
 void registerFunctionGlobalVariable(FunctionFactory &);
 void registerFunctionHasThreadFuzzer(FunctionFactory &);
 void registerFunctionInitializeAggregation(FunctionFactory &);
@ -123,6 +124,7 @@ void registerFunctionsMiscellaneous(FunctionFactory & factory)
    registerFunctionGetSetting(factory);
    registerFunctionIsConstant(factory);
    registerFunctionIsDecimalOverflow(factory);
    registerFunctionCountDigits(factory);
    registerFunctionGlobalVariable(factory);
    registerFunctionHasThreadFuzzer(factory);
    registerFunctionInitializeAggregation(factory);
--- a/src/Functions/ya.make
+++ b/src/Functions/ya.make
@ -132,6 +132,7 @@ SRCS(
    concat.cpp
    convertCharset.cpp
    cos.cpp
    countDigits.cpp
    CRC.cpp
    currentDatabase.cpp
    currentUser.cpp
@ -243,6 +244,7 @@ SRCS(
    intExp10.cpp
    intExp2.cpp
    isConstant.cpp
    isDecimalOverflow.cpp
    isFinite.cpp
    isInfinite.cpp
    isNaN.cpp
--- a/tests/queries/0_stateless/01458_count_digits.reference
+++ b/tests/queries/0_stateless/01458_count_digits.reference
@ -0,0 +1,6 @@
 0	2	2	0	2	3	0	2	4
 2	3	4
 10	10	19	19	39	39
 2	2	2	2	2	2	2	2	2	2	2	2
 0	0	0	0	0	0	0	0	0	0	0	0
 3	3	3	5	5	5	10	10	10	19	19	20
--- a/tests/queries/0_stateless/01458_count_digits.sql
+++ b/tests/queries/0_stateless/01458_count_digits.sql
@ -0,0 +1,26 @@
 -- Decimal32/64/128 arguments: zero, 42 with scale 0, and 4.2 with scale 1, 2 and 3.
 SELECT countDigits(toDecimal32(0, 0)), countDigits(toDecimal32(42, 0)), countDigits(toDecimal32(4.2, 1)),
       countDigits(toDecimal64(0, 0)), countDigits(toDecimal64(42, 0)), countDigits(toDecimal64(4.2, 2)),
       countDigits(toDecimal128(0, 0)), countDigits(toDecimal128(42, 0)), countDigits(toDecimal128(4.2, 3));
 -- The same 4.2 Decimal values wrapped in materialize().
 SELECT countDigits(materialize(toDecimal32(4.2, 1))),
       countDigits(materialize(toDecimal64(4.2, 2))),
       countDigits(materialize(toDecimal128(4.2, 3)));
 -- Decimal 1 and -1 at scales 9, 18 and 38.
 SELECT countDigits(toDecimal32(1, 9)), countDigits(toDecimal32(-1, 9)),
       countDigits(toDecimal64(1, 18)), countDigits(toDecimal64(-1, 18)),
       countDigits(toDecimal128(1, 38)), countDigits(toDecimal128(-1, 38));
 -- 42 and -42 for the signed types and 42 for the unsigned types, 8 to 64 bits wide.
 SELECT countDigits(toInt8(42)), countDigits(toInt8(-42)), countDigits(toUInt8(42)),
       countDigits(toInt16(42)), countDigits(toInt16(-42)), countDigits(toUInt16(42)),
       countDigits(toInt32(42)), countDigits(toInt32(-42)), countDigits(toUInt32(42)),
       countDigits(toInt64(42)), countDigits(toInt64(-42)), countDigits(toUInt64(42));
 -- Zero for every integer type.
 SELECT countDigits(toInt8(0)), countDigits(toInt8(0)),  countDigits(toUInt8(0)),
       countDigits(toInt16(0)), countDigits(toInt16(0)), countDigits(toUInt16(0)),
       countDigits(toInt32(0)), countDigits(toInt32(0)), countDigits(toUInt32(0)),
       countDigits(toInt64(0)), countDigits(toInt64(0)), countDigits(toUInt64(0));
 -- Largest and smallest values of the signed types and largest values of the unsigned types.
 SELECT countDigits(toInt8(127)), countDigits(toInt8(-128)),  countDigits(toUInt8(255)),
       countDigits(toInt16(32767)), countDigits(toInt16(-32768)), countDigits(toUInt16(65535)),
       countDigits(toInt32(2147483647)), countDigits(toInt32(-2147483648)), countDigits(toUInt32(4294967295)),
       countDigits(toInt64(9223372036854775807)), countDigits(toInt64(-9223372036854775808)), countDigits(toUInt64(18446744073709551615));