mirror of
https://github.com/ClickHouse/ClickHouse.git
synced 2024-12-16 19:32:07 +00:00
0753fd1c77
Less duplication, less confusion ...
148 lines
5.1 KiB
C++
148 lines
5.1 KiB
C++
#include "config.h"
|
|
|
|
#if USE_H3
|
|
|
|
#include <vector>
|
|
#include <Columns/ColumnArray.h>
|
|
#include <Columns/ColumnsNumber.h>
|
|
#include <DataTypes/DataTypeArray.h>
|
|
#include <DataTypes/DataTypesNumber.h>
|
|
#include <DataTypes/IDataType.h>
|
|
#include <Functions/FunctionFactory.h>
|
|
#include <Functions/IFunction.h>
|
|
#include <Common/typeid_cast.h>
|
|
#include <Interpreters/castColumn.h>
|
|
|
|
#include <h3api.h>
|
|
|
|
|
|
namespace DB
|
|
{
|
|
|
|
namespace ErrorCodes
|
|
{
|
|
extern const int ILLEGAL_TYPE_OF_ARGUMENT;
|
|
extern const int PARAMETER_OUT_OF_BOUND;
|
|
extern const int ILLEGAL_COLUMN;
|
|
}
|
|
|
|
namespace
|
|
{
|
|
|
|
class FunctionH3KRing : public IFunction
|
|
{
|
|
public:
|
|
static constexpr auto name = "h3kRing";
|
|
|
|
static FunctionPtr create(ContextPtr) { return std::make_shared<FunctionH3KRing>(); }
|
|
|
|
std::string getName() const override { return name; }
|
|
|
|
size_t getNumberOfArguments() const override { return 2; }
|
|
bool useDefaultImplementationForConstants() const override { return true; }
|
|
bool isSuitableForShortCircuitArgumentsExecution(const DataTypesWithConstInfo & /*arguments*/) const override { return true; }
|
|
|
|
DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
|
|
{
|
|
const auto * arg = arguments[0].get();
|
|
if (!WhichDataType(arg).isUInt64())
|
|
throw Exception(
|
|
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT,
|
|
"Illegal type {} of argument {} of function {}. Must be UInt64",
|
|
arg->getName(), 1, getName());
|
|
|
|
arg = arguments[1].get();
|
|
if (!WhichDataType(arg).isNativeUInt())
|
|
throw Exception(
|
|
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT,
|
|
"Illegal type {} of argument {} of function {}. Must be unsigned native integer.",
|
|
arg->getName(),
|
|
2,
|
|
getName());
|
|
|
|
return std::make_shared<DataTypeArray>(std::make_shared<DataTypeUInt64>());
|
|
}
|
|
|
|
ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr &, size_t input_rows_count) const override
|
|
{
|
|
auto non_const_arguments = arguments;
|
|
for (auto & argument : non_const_arguments)
|
|
argument.column = argument.column->convertToFullColumnIfConst();
|
|
|
|
const auto * col_hindex = checkAndGetColumn<ColumnUInt64>(non_const_arguments[0].column.get());
|
|
if (!col_hindex)
|
|
throw Exception(
|
|
ErrorCodes::ILLEGAL_COLUMN,
|
|
"Illegal type {} of argument {} of function {}. Must be UInt64.",
|
|
arguments[0].type->getName(),
|
|
1,
|
|
getName());
|
|
|
|
const auto & data_hindex = col_hindex->getData();
|
|
|
|
/// ColumnUInt16 is sufficient as the max value of 2nd arg is checked (arg > 0 < 10000) in implementation below
|
|
auto cast_result = castColumnAccurate(non_const_arguments[1], std::make_shared<DataTypeUInt16>());
|
|
const auto * col_k = checkAndGetColumn<ColumnUInt16>(cast_result.get());
|
|
if (!col_k)
|
|
throw Exception(
|
|
ErrorCodes::ILLEGAL_COLUMN,
|
|
"Illegal type {} of argument {} of function {}. Must be UInt16.",
|
|
arguments[1].type->getName(),
|
|
2,
|
|
getName());
|
|
|
|
const auto & data_k = col_k->getData();
|
|
|
|
auto dst = ColumnArray::create(ColumnUInt64::create());
|
|
auto & dst_data = dst->getData();
|
|
auto & dst_offsets = dst->getOffsets();
|
|
dst_offsets.resize(input_rows_count);
|
|
auto current_offset = 0;
|
|
|
|
for (size_t row = 0; row < input_rows_count; ++row)
|
|
{
|
|
const H3Index origin_hindex = data_hindex[row];
|
|
const int k = data_k[row];
|
|
|
|
/// Overflow is possible. The function maxGridDiskSize does not check for overflow.
|
|
/// The calculation is similar to square of k but several times more.
|
|
/// Let's use huge underestimation as the safe bound. We should not allow to generate too large arrays nevertheless.
|
|
constexpr auto max_k = 10000;
|
|
if (k > max_k)
|
|
throw Exception(ErrorCodes::PARAMETER_OUT_OF_BOUND, "Too large 'k' argument for {} function, maximum {}", getName(), max_k);
|
|
/// Check is already made while fetching the argument for k (to determine if it's an unsigned integer). Nevertheless, it's checked again here.
|
|
if (k < 0)
|
|
throw Exception(ErrorCodes::PARAMETER_OUT_OF_BOUND, "Argument 'k' for {} function must be non negative", getName());
|
|
|
|
const auto vec_size = maxGridDiskSize(k);
|
|
std::vector<H3Index> hindex_vec;
|
|
hindex_vec.resize(vec_size);
|
|
gridDisk(origin_hindex, k, hindex_vec.data());
|
|
|
|
dst_data.reserve(dst_data.size() + vec_size);
|
|
for (auto hindex : hindex_vec)
|
|
{
|
|
if (hindex != 0)
|
|
{
|
|
++current_offset;
|
|
dst_data.insert(hindex);
|
|
}
|
|
}
|
|
dst_offsets[row] = current_offset;
|
|
}
|
|
|
|
return dst;
|
|
}
|
|
};
|
|
|
|
}
|
|
|
|
REGISTER_FUNCTION(H3KRing)
|
|
{
|
|
factory.registerFunction<FunctionH3KRing>();
|
|
}
|
|
|
|
}
|
|
|
|
#endif
|