#pragma once #include #include namespace DB { template struct MultiSearchFirstPositionImpl { using ResultType = UInt64; static constexpr bool is_using_hyperscan = false; /// Variable for understanding, if we used offsets for the output, most /// likely to determine whether the function returns ColumnVector of ColumnArray. static constexpr bool is_column_array = false; static auto getReturnType() { return std::make_shared>(); } static void vectorConstant( const ColumnString::Chars & haystack_data, const ColumnString::Offsets & haystack_offsets, const std::vector & needles, PaddedPODArray & res, [[maybe_unused]] PaddedPODArray & offsets) { auto res_callback = [](const UInt8 * start, const UInt8 * end) -> UInt64 { return 1 + Impl::countChars(reinterpret_cast(start), reinterpret_cast(end)); }; auto searcher = Impl::createMultiSearcherInBigHaystack(needles); const size_t haystack_string_size = haystack_offsets.size(); res.resize(haystack_string_size); size_t iteration = 0; while (searcher.hasMoreToSearch()) { size_t prev_offset = 0; for (size_t j = 0; j < haystack_string_size; ++j) { const auto * haystack = &haystack_data[prev_offset]; const auto * haystack_end = haystack + haystack_offsets[j] - prev_offset - 1; if (iteration == 0 || res[j] == 0) res[j] = searcher.searchOneFirstPosition(haystack, haystack_end, res_callback); else { UInt64 result = searcher.searchOneFirstPosition(haystack, haystack_end, res_callback); if (result != 0) res[j] = std::min(result, res[j]); } prev_offset = haystack_offsets[j]; } ++iteration; } } }; }