add countDigits() function

This commit is contained in:
Artem Zuikov 2020-08-27 16:17:13 +03:00
parent 724b38adc9
commit 2a0b98b19c
6 changed files with 204 additions and 35 deletions

View File

@ -0,0 +1,155 @@
#include <Functions/IFunctionImpl.h>
#include <Functions/FunctionFactory.h>
#include <Functions/FunctionHelpers.h>
#include <DataTypes/DataTypesNumber.h>
#include <DataTypes/DataTypesDecimal.h>
#include <Columns/ColumnsNumber.h>
#include <Columns/ColumnDecimal.h>
#include <Columns/ColumnConst.h>
namespace DB
{
namespace ErrorCodes
{
extern const int ILLEGAL_TYPE_OF_ARGUMENT;
extern const int ILLEGAL_COLUMN;
}
/// Returns the number of decimal digits needed to represent the value.
/// The sign is not counted and zero yields 0 (the digit-stripping loops below never run for 0).
/// For Decimal arguments the digits of the underlying integer (`.value`, which includes the scale) are counted,
/// e.g. countDigits(toDecimal32(4.2, 1)) = 2 and countDigits(toDecimal64(4.2, 2)) = 3.
class FunctionCountDigits : public IFunction
{
public:
    static constexpr auto name = "countDigits";

    static FunctionPtr create(const Context &)
    {
        return std::make_shared<FunctionCountDigits>();
    }

    String getName() const override { return name; }
    bool useDefaultImplementationForNulls() const override { return false; }
    size_t getNumberOfArguments() const override { return 1; }

    /// Accepts a single signed integer, unsigned integer or Decimal argument.
    /// Throws ILLEGAL_TYPE_OF_ARGUMENT for any other type.
    DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
    {
        WhichDataType which_first(arguments[0]->getTypeId());

        if (!which_first.isInt() && !which_first.isUInt() && !which_first.isDecimal())
            throw Exception("Illegal type " + arguments[0]->getName() + " of argument of function " + getName(),
                            ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);

        return std::make_shared<DataTypeUInt8>(); /// Up to 255 decimal digits.
    }

    /// Fills the result position of the block with a UInt8 column holding the digit count of every input row.
    /// Throws ILLEGAL_COLUMN if the argument column is missing or is neither a constant nor a full
    /// numeric/decimal column of the declared argument type.
    void executeImpl(Block & block, const ColumnNumbers & arguments, size_t result_pos, size_t input_rows_count) const override
    {
        const auto & src_column = block.getByPosition(arguments[0]);
        if (!src_column.column)
            throw Exception("Illegal column while execute function " + getName(), ErrorCodes::ILLEGAL_COLUMN);

        auto result_column = ColumnUInt8::create();

        /// Invoked by callOnBasicType with a type pair; Types::RightType is the concrete argument type.
        auto call = [&](const auto & types) -> bool
        {
            using Types = std::decay_t<decltype(types)>;
            using Type = typename Types::RightType;
            using ColVecType = std::conditional_t<IsDecimalNumber<Type>, ColumnDecimal<Type>, ColumnVector<Type>>;

            if (const ColumnConst * const_column = checkAndGetColumnConst<ColVecType>(src_column.column.get()))
            {
                /// Constant argument: count the digits once and replicate the result for every row.
                Type const_value = checkAndGetColumn<ColVecType>(const_column->getDataColumnPtr().get())->getData()[0];

                UInt32 num_digits = 0;
                if constexpr (IsDecimalNumber<Type>)
                    num_digits = digits(const_value.value);
                else
                    num_digits = digits(const_value);

                result_column->getData().resize_fill(input_rows_count, num_digits);
                return true;
            }
            else if (const ColVecType * col_vec = checkAndGetColumn<ColVecType>(src_column.column.get()))
            {
                execute<Type>(*col_vec, *result_column, input_rows_count);
                return true;
            }

            /// The column does not match its declared type: this is a column problem, not an argument type problem.
            throw Exception("Illegal column while execute function " + getName(), ErrorCodes::ILLEGAL_COLUMN);
        };

        /// NOTE(review): the template flags presumably restrict dispatch to integer and decimal types,
        /// mirroring the check in getReturnTypeImpl - confirm against callOnBasicType.
        TypeIndex type_idx = src_column.type->getTypeId();
        if (!callOnBasicType<void, true, false, true, false>(type_idx, call))
            throw Exception("Wrong call for " + getName() + " with " + src_column.type->getName(),
                            ErrorCodes::ILLEGAL_COLUMN);

        block.getByPosition(result_pos).column = std::move(result_column);
    }

private:
    /// Computes the digit count for each of the first `rows_count` values of `col` and writes it into `result_column`.
    /// For Decimal types the underlying integer (`.value`) is used.
    template <typename T, typename ColVecType>
    static void execute(const ColVecType & col, ColumnUInt8 & result_column, size_t rows_count)
    {
        using NativeT = typename NativeType<T>::Type;

        const auto & src_data = col.getData();
        auto & dst_data = result_column.getData();
        dst_data.resize(rows_count);

        for (size_t i = 0; i < rows_count; ++i)
        {
            if constexpr (IsDecimalNumber<T>)
                dst_data[i] = digits<NativeT>(src_data[i].value);
            else
                dst_data[i] = digits<NativeT>(src_data[i]);
        }
    }

    /// Counts the decimal digits of an integer value. Returns 0 for zero; the sign is not counted.
    /// The value is never negated: integer division truncates toward zero, so negative values
    /// (including the minimum of a signed type) converge to 0 the same way positive ones do.
    template <typename T>
    static UInt32 digits(T value)
    {
        static_assert(!IsDecimalNumber<T>);

        /// The divisor has the signedness of T so that dividing a negative value
        /// is not turned into unsigned arithmetic by the usual arithmetic conversions.
        using DivT = std::conditional_t<is_signed_v<T>, Int32, UInt32>;

        UInt32 res = 0;
        T tmp;

        /// For types wider than 32 bits, strip 9 digits per division first.
        if constexpr (sizeof(T) > sizeof(Int32))
        {
            static constexpr const DivT e9 = 1000000000;

            tmp = value / e9;
            while (tmp != 0)
            {
                value = tmp;
                tmp /= e9;
                res += 9;
            }
        }

        /// Then strip 3 digits per division ...
        static constexpr const DivT e3 = 1000;

        tmp = value / e3;
        while (tmp != 0)
        {
            value = tmp;
            tmp /= e3;
            res += 3;
        }

        /// ... and finally count the remaining (at most 3) digits one by one.
        while (value != 0)
        {
            value /= 10;
            ++res;
        }
        return res;
    }
};
/// Registers FunctionCountDigits with the given function factory.
void registerFunctionCountDigits(FunctionFactory & factory)
{
factory.registerFunction<FunctionCountDigits>();
}
}

View File

@ -6,6 +6,7 @@
#include <Columns/ColumnsNumber.h>
#include <Columns/ColumnDecimal.h>
#include <Columns/ColumnConst.h>
#include <Common/intExp.h>
namespace DB
@ -37,7 +38,7 @@ public:
DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
{
if (arguments.size() < 1 || arguments.size() > 2)
if (arguments.empty() || arguments.size() > 2)
throw Exception("Number of arguments for function " + getName() + " doesn't match: passed " +
toString(arguments.size()) + ", should be 1 or 2.", ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH);
@ -87,13 +88,12 @@ public:
{
using Types = std::decay_t<decltype(types)>;
using Type = typename Types::RightType;
using NativeT = typename Type::NativeType;
using ColVecType = ColumnDecimal<Type>;
if (const ColumnConst * const_column = checkAndGetColumnConst<ColVecType>(src_column.column.get()))
{
Type const_decimal = checkAndGetColumn<ColVecType>(const_column->getDataColumnPtr().get())->getData()[0];
UInt8 res_value = (digits<NativeT>(const_decimal.value) > precision);
UInt8 res_value = outOfDigits<Type>(const_decimal, precision);
result_column->getData().resize_fill(input_rows_count, res_value);
return true;
}
@ -118,50 +118,28 @@ private:
template <typename T>
static void execute(const ColumnDecimal<T> & col, ColumnUInt8 & result_column, size_t rows_count, UInt32 precision)
{
using NativeT = typename T::NativeType;
const auto & src_data = col.getData();
auto & dst_data = result_column.getData();
dst_data.resize(rows_count);
for (size_t i = 0; i < rows_count; ++i)
dst_data[i] = (digits<NativeT>(src_data[i].value) > precision);
dst_data[i] = outOfDigits<T>(src_data[i], precision);
}
template <typename T>
static UInt32 digits(T value)
static bool outOfDigits(T dec, UInt32 precision)
{
UInt32 res = 0;
T tmp;
static_assert(IsDecimalNumber<T>);
using NativeT = typename T::NativeType;
static constexpr const Int32 e3 = 1000;
static constexpr const Int32 e9 = 1000000000;
if (precision > DecimalUtils::maxPrecision<T>())
return false;
if constexpr (sizeof(T) > sizeof(Int32))
{
tmp = value / e9;
while (tmp)
{
value = tmp;
tmp /= e9;
res += 9;
}
}
NativeT pow10 = intExp10OfSize<NativeT>(precision);
tmp = value / e3;
while (tmp)
{
value = tmp;
tmp /= e3;
res += 3;
}
while (value)
{
value /= 10;
++res;
}
return res;
if (dec.value < 0)
return dec.value <= -pow10;
return dec.value >= pow10;
}
};

View File

@ -60,6 +60,7 @@ void registerFunctionGetScalar(FunctionFactory &);
void registerFunctionGetSetting(FunctionFactory &);
void registerFunctionIsConstant(FunctionFactory &);
void registerFunctionIsDecimalOverflow(FunctionFactory &);
void registerFunctionCountDigits(FunctionFactory &);
void registerFunctionGlobalVariable(FunctionFactory &);
void registerFunctionHasThreadFuzzer(FunctionFactory &);
void registerFunctionInitializeAggregation(FunctionFactory &);
@ -123,6 +124,7 @@ void registerFunctionsMiscellaneous(FunctionFactory & factory)
registerFunctionGetSetting(factory);
registerFunctionIsConstant(factory);
registerFunctionIsDecimalOverflow(factory);
registerFunctionCountDigits(factory);
registerFunctionGlobalVariable(factory);
registerFunctionHasThreadFuzzer(factory);
registerFunctionInitializeAggregation(factory);

View File

@ -132,6 +132,7 @@ SRCS(
concat.cpp
convertCharset.cpp
cos.cpp
countDigits.cpp
CRC.cpp
currentDatabase.cpp
currentUser.cpp
@ -243,6 +244,7 @@ SRCS(
intExp10.cpp
intExp2.cpp
isConstant.cpp
isDecimalOverflow.cpp
isFinite.cpp
isInfinite.cpp
isNaN.cpp

View File

@ -0,0 +1,6 @@
0 2 2 0 2 3 0 2 4
2 3 4
10 10 19 19 39 39
2 2 2 2 2 2 2 2 2 2 2 2
0 0 0 0 0 0 0 0 0 0 0 0
3 3 3 5 5 5 10 10 10 19 19 20

View File

@ -0,0 +1,26 @@
-- Constant Decimal arguments: the digits of the underlying integer are counted, so the scale matters.
-- Expected: 0 2 2 0 2 3 0 2 4
SELECT countDigits(toDecimal32(0, 0)), countDigits(toDecimal32(42, 0)), countDigits(toDecimal32(4.2, 1)),
countDigits(toDecimal64(0, 0)), countDigits(toDecimal64(42, 0)), countDigits(toDecimal64(4.2, 2)),
countDigits(toDecimal128(0, 0)), countDigits(toDecimal128(42, 0)), countDigits(toDecimal128(4.2, 3));
-- Same values through materialize(), i.e. as non-constant columns.
-- Expected: 2 3 4
SELECT countDigits(materialize(toDecimal32(4.2, 1))),
countDigits(materialize(toDecimal64(4.2, 2))),
countDigits(materialize(toDecimal128(4.2, 3)));
-- Largest scale used for each Decimal width, positive and negative values.
-- Expected: 10 10 19 19 39 39
SELECT countDigits(toDecimal32(1, 9)), countDigits(toDecimal32(-1, 9)),
countDigits(toDecimal64(1, 18)), countDigits(toDecimal64(-1, 18)),
countDigits(toDecimal128(1, 38)), countDigits(toDecimal128(-1, 38));
-- Signed and unsigned integers of every width; the sign is not counted.
-- Expected: 2 2 2 2 2 2 2 2 2 2 2 2
SELECT countDigits(toInt8(42)), countDigits(toInt8(-42)), countDigits(toUInt8(42)),
countDigits(toInt16(42)), countDigits(toInt16(-42)), countDigits(toUInt16(42)),
countDigits(toInt32(42)), countDigits(toInt32(-42)), countDigits(toUInt32(42)),
countDigits(toInt64(42)), countDigits(toInt64(-42)), countDigits(toUInt64(42));
-- Zero yields 0 digits for every integer type.
-- Expected: 0 0 0 0 0 0 0 0 0 0 0 0
SELECT countDigits(toInt8(0)), countDigits(toInt8(0)), countDigits(toUInt8(0)),
countDigits(toInt16(0)), countDigits(toInt16(0)), countDigits(toUInt16(0)),
countDigits(toInt32(0)), countDigits(toInt32(0)), countDigits(toUInt32(0)),
countDigits(toInt64(0)), countDigits(toInt64(0)), countDigits(toUInt64(0));
-- Boundary values (max signed, min signed, max unsigned) of every integer width.
-- Expected: 3 3 3 5 5 5 10 10 10 19 19 20
SELECT countDigits(toInt8(127)), countDigits(toInt8(-128)), countDigits(toUInt8(255)),
countDigits(toInt16(32767)), countDigits(toInt16(-32768)), countDigits(toUInt16(65535)),
countDigits(toInt32(2147483647)), countDigits(toInt32(-2147483648)), countDigits(toUInt32(4294967295)),
countDigits(toInt64(9223372036854775807)), countDigits(toInt64(-9223372036854775808)), countDigits(toUInt64(18446744073709551615));