ClickHouse/src/Functions/h3kRing.cpp

148 lines
5.1 KiB
C++
Raw Normal View History

2021-10-27 23:10:39 +00:00
#include "config_functions.h"
2020-11-04 14:51:41 +00:00
#if USE_H3
2020-06-19 10:06:42 +00:00
#include <vector>
#include <Columns/ColumnArray.h>
#include <Columns/ColumnsNumber.h>
#include <DataTypes/DataTypeArray.h>
#include <DataTypes/DataTypesNumber.h>
#include <DataTypes/IDataType.h>
#include <Functions/FunctionFactory.h>
#include <Functions/IFunction.h>
#include <Common/typeid_cast.h>
2022-05-13 13:20:04 +00:00
#include <Interpreters/castColumn.h>
2020-06-19 10:06:42 +00:00
#include <h3api.h>
2019-12-05 09:42:11 +00:00
namespace DB
{
2020-08-15 08:49:54 +00:00
2020-02-25 18:10:48 +00:00
namespace ErrorCodes
{
extern const int ILLEGAL_TYPE_OF_ARGUMENT;
2020-08-15 08:49:54 +00:00
extern const int PARAMETER_OUT_OF_BOUND;
2022-01-23 06:25:06 +00:00
extern const int ILLEGAL_COLUMN;
2020-02-25 18:10:48 +00:00
}
2020-08-15 08:49:54 +00:00
2020-09-07 18:00:37 +00:00
namespace
{
2019-12-05 09:42:11 +00:00
class FunctionH3KRing : public IFunction
{
public:
static constexpr auto name = "h3kRing";
2021-06-01 12:20:52 +00:00
static FunctionPtr create(ContextPtr) { return std::make_shared<FunctionH3KRing>(); }
2019-12-05 09:42:11 +00:00
std::string getName() const override { return name; }
size_t getNumberOfArguments() const override { return 2; }
bool useDefaultImplementationForConstants() const override { return true; }
2021-06-22 16:21:23 +00:00
bool isSuitableForShortCircuitArgumentsExecution(const DataTypesWithConstInfo & /*arguments*/) const override { return true; }
2019-12-05 09:42:11 +00:00
DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
{
2020-04-22 08:31:10 +00:00
const auto * arg = arguments[0].get();
2019-12-05 09:42:11 +00:00
if (!WhichDataType(arg).isUInt64())
throw Exception(
2021-07-13 12:54:00 +00:00
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT,
"Illegal type {} of argument {} of function {}. Must be UInt64",
arg->getName(), 1, getName());
2019-12-05 09:42:11 +00:00
arg = arguments[1].get();
2022-05-13 13:20:04 +00:00
if (!WhichDataType(arg).isNativeUInt())
2019-12-05 09:42:11 +00:00
throw Exception(
2021-07-13 12:54:00 +00:00
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT,
2022-05-13 13:20:04 +00:00
"Illegal type {} of argument {} of function {}. Must be unsigned native integer.",
2022-01-23 06:25:06 +00:00
arg->getName(),
2,
getName());
2019-12-05 09:42:11 +00:00
return std::make_shared<DataTypeArray>(std::make_shared<DataTypeUInt64>());
}
ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr &, size_t input_rows_count) const override
2019-12-05 09:42:11 +00:00
{
2022-02-18 23:16:26 +00:00
auto non_const_arguments = arguments;
for (auto & argument : non_const_arguments)
argument.column = argument.column->convertToFullColumnIfConst();
const auto * col_hindex = checkAndGetColumn<ColumnUInt64>(non_const_arguments[0].column.get());
2022-01-23 06:25:06 +00:00
if (!col_hindex)
throw Exception(
ErrorCodes::ILLEGAL_COLUMN,
"Illegal type {} of argument {} of function {}. Must be UInt64.",
arguments[0].type->getName(),
1,
getName());
const auto & data_hindex = col_hindex->getData();
2022-01-23 14:20:31 +00:00
/// ColumnUInt16 is sufficient as the max value of 2nd arg is checked (arg > 0 < 10000) in implementation below
2022-05-13 13:20:04 +00:00
auto cast_result = castColumnAccurate(non_const_arguments[1], std::make_shared<DataTypeUInt16>());
const auto * col_k = checkAndGetColumn<ColumnUInt16>(cast_result.get());
2022-01-23 06:25:06 +00:00
if (!col_k)
throw Exception(
ErrorCodes::ILLEGAL_COLUMN,
2022-01-23 14:20:31 +00:00
"Illegal type {} of argument {} of function {}. Must be UInt16.",
2022-01-23 07:01:56 +00:00
arguments[1].type->getName(),
2022-01-23 06:25:06 +00:00
2,
getName());
const auto & data_k = col_k->getData();
2019-12-05 09:42:11 +00:00
auto dst = ColumnArray::create(ColumnUInt64::create());
auto & dst_data = dst->getData();
auto & dst_offsets = dst->getOffsets();
dst_offsets.resize(input_rows_count);
auto current_offset = 0;
2021-12-20 10:32:13 +00:00
for (size_t row = 0; row < input_rows_count; ++row)
2019-12-05 09:42:11 +00:00
{
2022-01-23 06:25:06 +00:00
const H3Index origin_hindex = data_hindex[row];
const int k = data_k[row];
2019-12-05 09:42:11 +00:00
2021-06-22 09:23:27 +00:00
/// Overflow is possible. The function maxGridDiskSize does not check for overflow.
2020-08-15 08:49:54 +00:00
/// The calculation is similar to square of k but several times more.
/// Let's use huge underestimation as the safe bound. We should not allow to generate too large arrays nevertheless.
constexpr auto max_k = 10000;
if (k > max_k)
throw Exception(ErrorCodes::PARAMETER_OUT_OF_BOUND, "Too large 'k' argument for {} function, maximum {}", getName(), max_k);
2022-01-23 08:28:21 +00:00
/// Check is already made while fetching the argument for k (to determine if it's an unsigned integer). Nevertheless, it's checked again here.
2020-08-15 08:49:54 +00:00
if (k < 0)
throw Exception(ErrorCodes::PARAMETER_OUT_OF_BOUND, "Argument 'k' for {} function must be non negative", getName());
2021-06-22 09:23:27 +00:00
const auto vec_size = maxGridDiskSize(k);
std::vector<H3Index> hindex_vec;
2019-12-05 09:42:11 +00:00
hindex_vec.resize(vec_size);
2021-06-22 09:23:27 +00:00
gridDisk(origin_hindex, k, hindex_vec.data());
2019-12-05 09:42:11 +00:00
dst_data.reserve(dst_data.size() + vec_size);
for (auto hindex : hindex_vec)
{
if (hindex != 0)
{
2019-12-16 18:34:51 +00:00
++current_offset;
2019-12-05 09:42:11 +00:00
dst_data.insert(hindex);
}
}
dst_offsets[row] = current_offset;
}
2020-10-19 13:42:14 +00:00
return dst;
2019-12-05 09:42:11 +00:00
}
};
2020-09-07 18:00:37 +00:00
}
2019-12-05 09:42:11 +00:00
/// Registers FunctionH3KRing in the function factory.
REGISTER_FUNCTION(H3KRing)
{
    factory.registerFunction<FunctionH3KRing>();
}
}
2020-11-04 14:51:41 +00:00
#endif