add countDigits() function

2024-11-21 15:12:02 +00:00 · 2020-08-27 16:17:13 +03:00 · 2020-08-27 16:17:13 +03:00 · 2a0b98b19c
commit 2a0b98b19c
parent 724b38adc9
6 changed files with 204 additions and 35 deletions
--- a/src/Functions/countDigits.cpp
+++ b/src/Functions/countDigits.cpp
@ -0,0 +1,155 @@
+#include <Functions/IFunctionImpl.h>
+#include <Functions/FunctionFactory.h>
+#include <Functions/FunctionHelpers.h>
+#include <DataTypes/DataTypesNumber.h>
+#include <DataTypes/DataTypesDecimal.h>
+#include <Columns/ColumnsNumber.h>
+#include <Columns/ColumnDecimal.h>
+#include <Columns/ColumnConst.h>
+
+
+namespace DB
+{
+
+namespace ErrorCodes
+{
+    extern const int ILLEGAL_TYPE_OF_ARGUMENT;
+    extern const int ILLEGAL_COLUMN;
+}
+
+/// Returns 1 if and Decimal value has more digits then it's Precision allow, 0 otherwise.
+/// Precision could be set as second argument or omitted. If ommited function uses Decimal presicion of the first argument.
+class FunctionCountDigits : public IFunction
+{
+public:
+    static constexpr auto name = "countDigits";
+
+    static FunctionPtr create(const Context &)
+    {
+        return std::make_shared<FunctionCountDigits>();
+    }
+
+    String getName() const override { return name; }
+    bool useDefaultImplementationForNulls() const override { return false; }
+    size_t getNumberOfArguments() const override { return 1; }
+
+    DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
+    {
+        WhichDataType which_first(arguments[0]->getTypeId());
+
+        if (!which_first.isInt() && !which_first.isUInt() && !which_first.isDecimal())
+            throw Exception("Illegal type " + arguments[0]->getName() + " of argument of function " + getName(),
+                            ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
+
+        return std::make_shared<DataTypeUInt8>(); /// Up to 255 decimal digits.
+    }
+
+    void executeImpl(Block & block, const ColumnNumbers & arguments, size_t result_pos, size_t input_rows_count) const override
+    {
+        const auto & src_column = block.getByPosition(arguments[0]);
+        if (!src_column.column)
+            throw Exception("Illegal column while execute function " + getName(), ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
+
+        auto result_column = ColumnUInt8::create();
+
+        auto call = [&](const auto & types) -> bool
+        {
+            using Types = std::decay_t<decltype(types)>;
+            using Type = typename Types::RightType;
+            using ColVecType = std::conditional_t<IsDecimalNumber<Type>, ColumnDecimal<Type>, ColumnVector<Type>>;
+
+            if (const ColumnConst * const_column = checkAndGetColumnConst<ColVecType>(src_column.column.get()))
+            {
+                Type const_value = checkAndGetColumn<ColVecType>(const_column->getDataColumnPtr().get())->getData()[0];
+                UInt32 num_digits = 0;
+                if constexpr (IsDecimalNumber<Type>)
+                    num_digits = digits(const_value.value);
+                else
+                    num_digits = digits(const_value);
+                result_column->getData().resize_fill(input_rows_count, num_digits);
+                return true;
+            }
+            else if (const ColVecType * col_vec = checkAndGetColumn<ColVecType>(src_column.column.get()))
+            {
+                execute<Type>(*col_vec, *result_column, input_rows_count);
+                return true;
+            }
+
+            throw Exception("Illegal column while execute function " + getName(), ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
+        };
+
+        TypeIndex dec_type_idx = src_column.type->getTypeId();
+        if (!callOnBasicType<void, true, false, true, false>(dec_type_idx, call))
+            throw Exception("Wrong call for " + getName() + " with " + src_column.type->getName(),
+                            ErrorCodes::ILLEGAL_COLUMN);
+
+        block.getByPosition(result_pos).column = std::move(result_column);
+    }
+
+private:
+    template <typename T, typename ColVecType>
+    static void execute(const ColVecType & col, ColumnUInt8 & result_column, size_t rows_count)
+    {
+        using NativeT = typename NativeType<T>::Type;
+
+        const auto & src_data = col.getData();
+        auto & dst_data = result_column.getData();
+        dst_data.resize(rows_count);
+
+        for (size_t i = 0; i < rows_count; ++i)
+        {
+            if constexpr (IsDecimalNumber<T>)
+                dst_data[i] = digits<NativeT>(src_data[i].value);
+            else
+                dst_data[i] = digits<NativeT>(src_data[i]);
+        }
+    }
+
+    template <typename T>
+    static UInt32 digits(T value)
+    {
+        static_assert(!IsDecimalNumber<T>);
+        using DivT = std::conditional_t<is_signed_v<T>, Int32, UInt32>;
+
+        UInt32 res = 0;
+        T tmp;
+
+        if constexpr (sizeof(T) > sizeof(Int32))
+        {
+            static constexpr const DivT e9 = 1000000000;
+
+            tmp = value / e9;
+            while (tmp != 0)
+            {
+                value = tmp;
+                tmp /= e9;
+                res += 9;
+            }
+        }
+
+        static constexpr const DivT e3 = 1000;
+
+        tmp = value / e3;
+        while (tmp != 0)
+        {
+            value = tmp;
+            tmp /= e3;
+            res += 3;
+        }
+
+        while (value != 0)
+        {
+            value /= 10;
+            ++res;
+        }
+        return res;
+    }
+};
+
+
+void registerFunctionCountDigits(FunctionFactory & factory)
+{
+    factory.registerFunction<FunctionCountDigits>();
+}
+
+}
--- a/src/Functions/isDecimalOverflow.cpp
+++ b/src/Functions/isDecimalOverflow.cpp
@ -6,6 +6,7 @@
 #include <Columns/ColumnsNumber.h>
 #include <Columns/ColumnDecimal.h>
 #include <Columns/ColumnConst.h>
+#include <Common/intExp.h>


 namespace DB
@ -37,7 +38,7 @@ public:

    DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
    {
-        if (arguments.size() < 1 || arguments.size() > 2)
+        if (arguments.empty() || arguments.size() > 2)
            throw Exception("Number of arguments for function " + getName() + " doesn't match: passed " +
                toString(arguments.size()) + ", should be 1 or 2.", ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH);

@ -87,13 +88,12 @@ public:
        {
            using Types = std::decay_t<decltype(types)>;
            using Type = typename Types::RightType;
-            using NativeT = typename Type::NativeType;
            using ColVecType = ColumnDecimal<Type>;

            if (const ColumnConst * const_column = checkAndGetColumnConst<ColVecType>(src_column.column.get()))
            {
                Type const_decimal = checkAndGetColumn<ColVecType>(const_column->getDataColumnPtr().get())->getData()[0];
-                UInt8 res_value = (digits<NativeT>(const_decimal.value) > precision);
+                UInt8 res_value = outOfDigits<Type>(const_decimal, precision);
                result_column->getData().resize_fill(input_rows_count, res_value);
                return true;
            }
@ -118,50 +118,28 @@ private:
    template <typename T>
    static void execute(const ColumnDecimal<T> & col, ColumnUInt8 & result_column, size_t rows_count, UInt32 precision)
    {
-        using NativeT = typename T::NativeType;
-
        const auto & src_data = col.getData();
        auto & dst_data = result_column.getData();
        dst_data.resize(rows_count);

        for (size_t i = 0; i < rows_count; ++i)
-            dst_data[i] = (digits<NativeT>(src_data[i].value) > precision);
+            dst_data[i] = outOfDigits<T>(src_data[i], precision);
    }

    template <typename T>
-    static UInt32 digits(T value)
+    static bool outOfDigits(T dec, UInt32 precision)
    {
-        UInt32 res = 0;
-        T tmp;
+        static_assert(IsDecimalNumber<T>);
+        using NativeT = typename T::NativeType;

-        static constexpr const Int32 e3 = 1000;
-        static constexpr const Int32 e9 = 1000000000;
+        if (precision > DecimalUtils::maxPrecision<T>())
+            return false;

-        if constexpr (sizeof(T) > sizeof(Int32))
-        {
-            tmp = value / e9;
-            while (tmp)
-            {
-                value = tmp;
-                tmp /= e9;
-                res += 9;
-            }
-        }
+        NativeT pow10 = intExp10OfSize<NativeT>(precision);

-        tmp = value / e3;
-        while (tmp)
-        {
-            value = tmp;
-            tmp /= e3;
-            res += 3;
-        }
-
-        while (value)
-        {
-            value /= 10;
-            ++res;
-        }
-        return res;
+        if (dec.value < 0)
+            return dec.value <= -pow10;
+        return dec.value >= pow10;
    }
 };

--- a/src/Functions/registerFunctionsMiscellaneous.cpp
+++ b/src/Functions/registerFunctionsMiscellaneous.cpp
@ -60,6 +60,7 @@ void registerFunctionGetScalar(FunctionFactory &);
 void registerFunctionGetSetting(FunctionFactory &);
 void registerFunctionIsConstant(FunctionFactory &);
 void registerFunctionIsDecimalOverflow(FunctionFactory &);
+void registerFunctionCountDigits(FunctionFactory &);
 void registerFunctionGlobalVariable(FunctionFactory &);
 void registerFunctionHasThreadFuzzer(FunctionFactory &);
 void registerFunctionInitializeAggregation(FunctionFactory &);
@ -123,6 +124,7 @@ void registerFunctionsMiscellaneous(FunctionFactory & factory)
    registerFunctionGetSetting(factory);
    registerFunctionIsConstant(factory);
    registerFunctionIsDecimalOverflow(factory);
+    registerFunctionCountDigits(factory);
    registerFunctionGlobalVariable(factory);
    registerFunctionHasThreadFuzzer(factory);
    registerFunctionInitializeAggregation(factory);
--- a/src/Functions/ya.make
+++ b/src/Functions/ya.make
@ -132,6 +132,7 @@ SRCS(
    concat.cpp
    convertCharset.cpp
    cos.cpp
+    countDigits.cpp
    CRC.cpp
    currentDatabase.cpp
    currentUser.cpp
@ -243,6 +244,7 @@ SRCS(
    intExp10.cpp
    intExp2.cpp
    isConstant.cpp
+    isDecimalOverflow.cpp
    isFinite.cpp
    isInfinite.cpp
    isNaN.cpp
--- a/tests/queries/0_stateless/01458_count_digits.reference
+++ b/tests/queries/0_stateless/01458_count_digits.reference
@ -0,0 +1,6 @@
+0	2	2	0	2	3	0	2	4
+2	3	4
+10	10	19	19	39	39
+2	2	2	2	2	2	2	2	2	2	2	2
+0	0	0	0	0	0	0	0	0	0	0	0
+3	3	3	5	5	5	10	10	10	19	19	20
--- a/tests/queries/0_stateless/01458_count_digits.sql
+++ b/tests/queries/0_stateless/01458_count_digits.sql
@ -0,0 +1,26 @@
+SELECT countDigits(toDecimal32(0, 0)), countDigits(toDecimal32(42, 0)), countDigits(toDecimal32(4.2, 1)),
+       countDigits(toDecimal64(0, 0)), countDigits(toDecimal64(42, 0)), countDigits(toDecimal64(4.2, 2)),
+       countDigits(toDecimal128(0, 0)), countDigits(toDecimal128(42, 0)), countDigits(toDecimal128(4.2, 3));
+
+SELECT countDigits(materialize(toDecimal32(4.2, 1))),
+       countDigits(materialize(toDecimal64(4.2, 2))),
+       countDigits(materialize(toDecimal128(4.2, 3)));
+
+SELECT countDigits(toDecimal32(1, 9)), countDigits(toDecimal32(-1, 9)),
+       countDigits(toDecimal64(1, 18)), countDigits(toDecimal64(-1, 18)),
+       countDigits(toDecimal128(1, 38)), countDigits(toDecimal128(-1, 38));
+       
+SELECT countDigits(toInt8(42)), countDigits(toInt8(-42)), countDigits(toUInt8(42)),
+       countDigits(toInt16(42)), countDigits(toInt16(-42)), countDigits(toUInt16(42)),
+       countDigits(toInt32(42)), countDigits(toInt32(-42)), countDigits(toUInt32(42)),
+       countDigits(toInt64(42)), countDigits(toInt64(-42)), countDigits(toUInt64(42));
+
+SELECT countDigits(toInt8(0)), countDigits(toInt8(0)),  countDigits(toUInt8(0)),
+       countDigits(toInt16(0)), countDigits(toInt16(0)), countDigits(toUInt16(0)),
+       countDigits(toInt32(0)), countDigits(toInt32(0)), countDigits(toUInt32(0)),
+       countDigits(toInt64(0)), countDigits(toInt64(0)), countDigits(toUInt64(0));
+       
+SELECT countDigits(toInt8(127)), countDigits(toInt8(-128)),  countDigits(toUInt8(255)),
+       countDigits(toInt16(32767)), countDigits(toInt16(-32768)), countDigits(toUInt16(65535)),
+       countDigits(toInt32(2147483647)), countDigits(toInt32(-2147483648)), countDigits(toUInt32(4294967295)),
+       countDigits(toInt64(9223372036854775807)), countDigits(toInt64(-9223372036854775808)), countDigits(toUInt64(18446744073709551615));