ClickHouse/src/Functions/FunctionsConsistentHashing.h

Ignoring revisions in .git-blame-ignore-revs. Click here to bypass and see the normal blame view.

161 lines
5.9 KiB
C++
Raw Normal View History

#pragma once
#include <Columns/ColumnConst.h>
#include <Columns/ColumnsNumber.h>
#include <DataTypes/DataTypesNumber.h>
#include <Functions/FunctionHelpers.h>
2021-05-17 07:30:42 +00:00
#include <Functions/IFunction.h>
#include <Common/typeid_cast.h>
2023-01-08 20:58:09 +00:00
#include <base/IPv4andIPv6.h>
#include <Interpreters/Context_fwd.h>
namespace DB
{
/// Error codes thrown by the functions declared in this header.
namespace ErrorCodes
{
    extern const int ILLEGAL_TYPE_OF_ARGUMENT;
    extern const int BAD_ARGUMENTS;
}
template <typename Impl>
class FunctionConsistentHashImpl : public IFunction
{
public:
static constexpr auto name = Impl::name;
2021-06-01 12:20:52 +00:00
static FunctionPtr create(ContextPtr)
{
return std::make_shared<FunctionConsistentHashImpl<Impl>>();
2018-08-26 00:50:48 +00:00
}
String getName() const override
{
return name;
}
size_t getNumberOfArguments() const override
{
return 2;
}
2021-06-22 16:21:23 +00:00
bool isSuitableForShortCircuitArgumentsExecution(const DataTypesWithConstInfo & /*arguments*/) const override { return true; }
DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
{
2023-01-08 20:58:09 +00:00
if (!isInteger(arguments[0]) && !isIPv4(arguments[0]))
throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "Illegal type {} of the first argument of function {}",
arguments[0]->getName(), getName());
if (arguments[0]->getSizeOfValueInMemory() > sizeof(HashType))
throw Exception(ErrorCodes::BAD_ARGUMENTS, "Function {} accepts {}-bit integers at most, got {}",
getName(), sizeof(HashType) * 8, arguments[0]->getName());
if (!isInteger(arguments[1]))
throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "Illegal type {} of the second argument of function {}",
arguments[1]->getName(), getName());
return std::make_shared<DataTypeNumber<ResultType>>();
}
bool useDefaultImplementationForConstants() const override
{
return true;
}
ColumnNumbers getArgumentsThatAreAlwaysConstant() const override
{
return {1};
}
ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr &, size_t /*input_rows_count*/) const override
{
2020-10-18 14:49:19 +00:00
if (isColumnConst(*arguments[1].column))
return executeConstBuckets(arguments);
else
throw Exception(ErrorCodes::BAD_ARGUMENTS, "The second argument of function {} (number of buckets) must be constant",
getName());
}
private:
using HashType = typename Impl::HashType;
using ResultType = typename Impl::ResultType;
2019-08-02 22:40:28 +00:00
using BucketsType = typename Impl::BucketsType;
template <typename T>
2020-07-21 13:58:07 +00:00
inline BucketsType checkBucketsRange(T buckets) const
{
if (unlikely(buckets <= 0))
throw Exception(ErrorCodes::BAD_ARGUMENTS, "The second argument of function {} (number of buckets) must be positive number", getName());
2019-08-02 22:40:28 +00:00
if (unlikely(static_cast<UInt64>(buckets) > Impl::max_buckets))
throw Exception(ErrorCodes::BAD_ARGUMENTS, "The value of the second argument of function {} "
"(number of buckets) must not be greater than {}", getName(), Impl::max_buckets);
return static_cast<BucketsType>(buckets);
}
ColumnPtr executeConstBuckets(const ColumnsWithTypeAndName & arguments) const
{
2020-10-18 14:49:19 +00:00
Field buckets_field = (*arguments[1].column)[0];
BucketsType num_buckets;
if (buckets_field.getType() == Field::Types::Int64)
num_buckets = checkBucketsRange(buckets_field.get<Int64>());
else if (buckets_field.getType() == Field::Types::UInt64)
num_buckets = checkBucketsRange(buckets_field.get<UInt64>());
else
2021-09-06 15:59:46 +00:00
throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT,
"Illegal type {} of the second argument of function {}",
buckets_field.getTypeName(), getName());
2020-10-18 14:49:19 +00:00
const auto & hash_col = arguments[0].column;
const IDataType * hash_type = arguments[0].type.get();
auto res_col = ColumnVector<ResultType>::create();
WhichDataType which(hash_type);
if (which.isUInt8())
executeType<UInt8>(hash_col, num_buckets, res_col.get());
else if (which.isUInt16())
executeType<UInt16>(hash_col, num_buckets, res_col.get());
else if (which.isUInt32())
executeType<UInt32>(hash_col, num_buckets, res_col.get());
else if (which.isUInt64())
executeType<UInt64>(hash_col, num_buckets, res_col.get());
else if (which.isInt8())
executeType<Int8>(hash_col, num_buckets, res_col.get());
else if (which.isInt16())
executeType<Int16>(hash_col, num_buckets, res_col.get());
else if (which.isInt32())
executeType<Int32>(hash_col, num_buckets, res_col.get());
else if (which.isInt64())
executeType<Int64>(hash_col, num_buckets, res_col.get());
2023-01-08 20:58:09 +00:00
else if (which.isIPv4())
executeType<IPv4>(hash_col, num_buckets, res_col.get());
else
throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "Illegal type {} of the first argument of function {}",
hash_type->getName(), getName());
2020-10-18 14:49:19 +00:00
return res_col;
}
template <typename CurrentHashType>
2020-07-21 13:58:07 +00:00
void executeType(const ColumnPtr & col_hash_ptr, BucketsType num_buckets, ColumnVector<ResultType> * col_result) const
{
auto col_hash = checkAndGetColumn<ColumnVector<CurrentHashType>>(col_hash_ptr.get());
if (!col_hash)
throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "Illegal type of the first argument of function {}", getName());
auto & vec_result = col_result->getData();
const auto & vec_hash = col_hash->getData();
size_t size = vec_hash.size();
vec_result.resize(size);
for (size_t i = 0; i < size; ++i)
vec_result[i] = Impl::apply(static_cast<HashType>(vec_hash[i]), num_buckets);
}
};
}