#include #include #include #include #include #include #include #include #include #include namespace DB { namespace ErrorCodes { extern const int LOGICAL_ERROR; extern const int ILLEGAL_TYPE_OF_ARGUMENT; extern const int TOO_LARGE_ARRAY_SIZE; } class FunctionGeohashesInBox : public IFunction { public: static constexpr auto name = "geohashesInBox"; static FunctionPtr create(const Context &) { return std::make_shared(); } String getName() const override { return name; } size_t getNumberOfArguments() const override { return 5; } DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override { validateArgumentType(*this, arguments, 0, isFloat, "float"); validateArgumentType(*this, arguments, 1, isFloat, "float"); validateArgumentType(*this, arguments, 2, isFloat, "float"); validateArgumentType(*this, arguments, 3, isFloat, "float"); validateArgumentType(*this, arguments, 4, isUInt8, "integer"); if (!(arguments[0]->equals(*arguments[1]) && arguments[0]->equals(*arguments[2]) && arguments[0]->equals(*arguments[3]))) { throw Exception("Illegal type of argument of " + getName() + " all coordinate arguments must have the same type, instead they are:" + arguments[0]->getName() + ", " + arguments[1]->getName() + ", " + arguments[2]->getName() + ", " + arguments[3]->getName() + ".", ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT); } return std::make_shared(std::make_shared()); } bool useDefaultImplementationForConstants() const override { return true; } template void execute(const IColumn * lon_min_column, const IColumn * lat_min_column, const IColumn * lon_max_column, const IColumn * lat_max_column, const IColumn * precision_column, ColumnPtr & result) { static constexpr size_t max_array_size = 10'000'000; const auto * lon_min = checkAndGetColumn>(lon_min_column); const auto * lat_min = checkAndGetColumn>(lat_min_column); const auto * lon_max = checkAndGetColumn>(lon_max_column); const auto * lat_max = checkAndGetColumn>(lat_max_column); auto * precision = checkAndGetColumn>(precision_column); if (precision == nullptr) { precision = checkAndGetColumnConstData>(precision_column); } if (!lon_min || !lat_min || !lon_max || !lat_max || !precision) { throw Exception("Unsupported argument types for function " + getName() + " : " + lon_min_column->getName() + ", " + lat_min_column->getName() + ", " + lon_max_column->getName() + ", " + lat_max_column->getName() + ".", ErrorCodes::LOGICAL_ERROR); } const size_t total_rows = lat_min->size(); auto col_res = ColumnArray::create(ColumnString::create()); ColumnString & res_strings = typeid_cast(col_res->getData()); ColumnArray::Offsets & res_offsets = col_res->getOffsets(); ColumnString::Chars & res_strings_chars = res_strings.getChars(); ColumnString::Offsets & res_strings_offsets = res_strings.getOffsets(); for (size_t row = 0; row < total_rows; ++row) { const Float64 lon_min_value = lon_min->getElement(row); const Float64 lat_min_value = lat_min->getElement(row); const Float64 lon_max_value = lon_max->getElement(row); const Float64 lat_max_value = lat_max->getElement(row); const auto prepared_args = GeoUtils::geohashesInBoxPrepare( lon_min_value, lat_min_value, lon_max_value, lat_max_value, precision->getElement(row % precision->size())); if (prepared_args.items_count > max_array_size) { throw Exception(getName() + " would produce " + std::to_string(prepared_args.items_count) + " array elements, which is bigger than the allowed maximum of " + std::to_string(max_array_size), ErrorCodes::TOO_LARGE_ARRAY_SIZE); } res_strings_offsets.reserve(res_strings_offsets.size() + prepared_args.items_count); res_strings_chars.resize(res_strings_chars.size() + prepared_args.items_count * (prepared_args.precision + 1)); const auto starting_offset = res_strings_offsets.empty() ? 0 : res_strings_offsets.back(); char * out = reinterpret_cast(res_strings_chars.data() + starting_offset); // Actually write geohashes into preallocated buffer. GeoUtils::geohashesInBox(prepared_args, out); for (UInt8 i = 1; i <= prepared_args.items_count ; ++i) { res_strings_offsets.push_back(starting_offset + (prepared_args.precision + 1) * i); } res_offsets.push_back((res_offsets.empty() ? 0 : res_offsets.back()) + prepared_args.items_count); } if (!res_strings_offsets.empty() && res_strings_offsets.back() != res_strings_chars.size()) { throw Exception("String column size mismatch (internal logical error)", ErrorCodes::LOGICAL_ERROR); } if (!res_offsets.empty() && res_offsets.back() != res_strings.size()) { throw Exception("Arrary column size mismatch (internal logical error)" + std::to_string(res_offsets.back()) + " != " + std::to_string(res_strings.size()), ErrorCodes::LOGICAL_ERROR); } result = std::move(col_res); } void executeImpl(Block & block, const ColumnNumbers & arguments, size_t result, size_t /*input_rows_count*/) override { const IColumn * lon_min = block.getByPosition(arguments[0]).column.get(); const IColumn * lat_min = block.getByPosition(arguments[1]).column.get(); const IColumn * lon_max = block.getByPosition(arguments[2]).column.get(); const IColumn * lat_max = block.getByPosition(arguments[3]).column.get(); const IColumn * prec = block.getByPosition(arguments[4]).column.get(); ColumnPtr & res = block.getByPosition(result).column; if (checkColumn>(lon_min)) { execute(lon_min, lat_min, lon_max, lat_max, prec, res); } else { execute(lon_min, lat_min, lon_max, lat_max, prec, res); } } }; void registerFunctionGeohashesInBox(FunctionFactory & factory) { factory.registerFunction(); } }