Merge branch 'master' into database_atomic

2024-12-11 17:02:25 +00:00 · 2020-03-30 17:53:40 +03:00 · 2020-03-30 17:53:40 +03:00 · 731aeb2dbe
commit 731aeb2dbe
parent 0eb351044c 621bcaf2eb
681 changed files with 91278 additions and 2027 deletions
--- a/README.md
+++ b/README.md
@ -18,3 +18,4 @@ ClickHouse is an open-source column-oriented database management system that all
 * [ClickHouse Workshop in Novosibirsk](https://2020.codefest.ru/lecture/1628) on TBD date.
 * [Talks on Saint HighLoad++ in St. Petersburg](https://www.highload.ru/spb/2020/abstracts/6647) on TBD date.
 * [Yandex C++ Open-Source Sprints in Moscow](https://events.yandex.ru/events/otkrytyj-kod-v-yandek-28-03-2020) on TBD date.
 * [ClickHouse in Avito (online in Russian)](https://avitotech.timepad.ru/event/1290051/) on April 9, 2020.
--- a/base/daemon/BaseDaemon.cpp
+++ b/base/daemon/BaseDaemon.cpp
@ -367,137 +367,7 @@ void BaseDaemon::reloadConfiguration()
 }
-namespace
+BaseDaemon::BaseDaemon() = default;
 {
 enum class InstructionFail
 {
    NONE = 0,
    SSE3 = 1,
    SSSE3 = 2,
    SSE4_1 = 3,
    SSE4_2 = 4,
    AVX = 5,
    AVX2 = 6,
    AVX512 = 7
 };
 std::string instructionFailToString(InstructionFail fail)
 {
    switch (fail)
    {
        case InstructionFail::NONE:
            return "NONE";
        case InstructionFail::SSE3:
            return "SSE3";
        case InstructionFail::SSSE3:
            return "SSSE3";
        case InstructionFail::SSE4_1:
            return "SSE4.1";
        case InstructionFail::SSE4_2:
            return "SSE4.2";
        case InstructionFail::AVX:
            return "AVX";
        case InstructionFail::AVX2:
            return "AVX2";
        case InstructionFail::AVX512:
            return "AVX512";
    }
    __builtin_unreachable();
 }
 sigjmp_buf jmpbuf;
 void sigIllCheckHandler(int, siginfo_t *, void *)
 {
    siglongjmp(jmpbuf, 1);
 }
 /// Check if necessary sse extensions are available by trying to execute some sse instructions.
 /// If instruction is unavailable, SIGILL will be sent by kernel.
 void checkRequiredInstructionsImpl(volatile InstructionFail & fail)
 {
 #if __SSE3__
    fail = InstructionFail::SSE3;
    __asm__ volatile ("addsubpd %%xmm0, %%xmm0" : : : "xmm0");
 #endif
 #if __SSSE3__
    fail = InstructionFail::SSSE3;
    __asm__ volatile ("pabsw %%xmm0, %%xmm0" : : : "xmm0");
 #endif
 #if __SSE4_1__
    fail = InstructionFail::SSE4_1;
    __asm__ volatile ("pmaxud %%xmm0, %%xmm0" : : : "xmm0");
 #endif
 #if __SSE4_2__
    fail = InstructionFail::SSE4_2;
    __asm__ volatile ("pcmpgtq %%xmm0, %%xmm0" : : : "xmm0");
 #endif
 #if __AVX__
    fail = InstructionFail::AVX;
    __asm__ volatile ("vaddpd %%ymm0, %%ymm0, %%ymm0" : : : "ymm0");
 #endif
 #if __AVX2__
    fail = InstructionFail::AVX2;
    __asm__ volatile ("vpabsw %%ymm0, %%ymm0" : : : "ymm0");
 #endif
 #if __AVX512__
    fail = InstructionFail::AVX512;
    __asm__ volatile ("vpabsw %%zmm0, %%zmm0" : : : "zmm0");
 #endif
    fail = InstructionFail::NONE;
 }
 /// Check SSE and others instructions availability
 /// Calls exit on fail
 void checkRequiredInstructions()
 {
    struct sigaction sa{};
    struct sigaction sa_old{};
    sa.sa_sigaction = sigIllCheckHandler;
    sa.sa_flags = SA_SIGINFO;
    auto signal = SIGILL;
    if (sigemptyset(&sa.sa_mask) != 0
        || sigaddset(&sa.sa_mask, signal) != 0
        || sigaction(signal, &sa, &sa_old) != 0)
    {
        std::cerr << "Can not set signal handler\n";
        exit(1);
    }
    volatile InstructionFail fail = InstructionFail::NONE;
    if (sigsetjmp(jmpbuf, 1))
    {
        std::cerr << "Instruction check fail. There is no " << instructionFailToString(fail) << " instruction set\n";
        exit(1);
    }
    checkRequiredInstructionsImpl(fail);
    if (sigaction(signal, &sa_old, nullptr))
    {
        std::cerr << "Can not set signal handler\n";
        exit(1);
    }
 }
 }
 BaseDaemon::BaseDaemon()
 {
    checkRequiredInstructions();
 }
 BaseDaemon::~BaseDaemon()
--- a/dbms/programs/copier/Aliases.h
+++ b/dbms/programs/copier/Aliases.h
@ -3,19 +3,21 @@
 #include <Interpreters/Cluster.h>
 namespace DB
 {
    using ConfigurationPtr = Poco::AutoPtr<Poco::Util::AbstractConfiguration>;
    using DatabaseAndTableName = std::pair<String, String>;
    using ListOfDatabasesAndTableNames = std::vector<DatabaseAndTableName>;
    /// Hierarchical description of the tasks
    struct ShardPartitionPiece;
    struct ShardPartition;
    struct TaskShard;
    struct TaskTable;
    struct TaskCluster;
    struct ClusterPartition;
    using PartitionPieces = std::vector<ShardPartitionPiece>;
    using TasksPartition = std::map<String, ShardPartition, std::greater<>>;
    using ShardInfo = Cluster::ShardInfo;
    using TaskShardPtr = std::shared_ptr<TaskShard>;
--- a/dbms/programs/copier/CMakeLists.txt
+++ b/dbms/programs/copier/CMakeLists.txt
@ -12,6 +12,6 @@ set(CLICKHOUSE_COPIER_LINK PRIVATE
        clickhouse_dictionaries
        string_utils ${Poco_XML_LIBRARY} PUBLIC daemon)
-set(CLICKHOUSE_COPIER_INCLUDE SYSTEM PRIVATE ${PCG_RANDOM_INCLUDE_DIR})
+set(CLICKHOUSE_COPIER_INCLUDE SYSTEM PRIVATE ${PCG_RANDOM_INCLUDE_DIR} ${CMAKE_CURRENT_SOURCE_DIR})
 clickhouse_program_add(copier)
--- a/dbms/programs/copier/ClusterCopier.cpp
+++ b/dbms/programs/copier/ClusterCopier.cpp
--- a/dbms/programs/copier/ClusterCopier.h
+++ b/dbms/programs/copier/ClusterCopier.h
@ -5,8 +5,10 @@
 #include "TaskCluster.h"
 #include "TaskTableAndShard.h"
 #include "ShardPartition.h"
 #include "ShardPartitionPiece.h"
 #include "ZooKeeperStaff.h"
 namespace DB
 {
@ -27,10 +29,10 @@ public:
    void init();
-    template<typename T>
+    template <typename T>
    decltype(auto) retry(T && func, UInt64 max_tries = 100);
-    void discoverShardPartitions(const ConnectionTimeouts & timeouts, const TaskShardPtr & task_shard) ;
+    void discoverShardPartitions(const ConnectionTimeouts & timeouts, const TaskShardPtr & task_shard);
    /// Compute set of partitions, assume set of partitions aren't changed during the processing
    void discoverTablePartitions(const ConnectionTimeouts & timeouts, TaskTable & task_table, UInt64 num_threads = 0);
@ -54,6 +56,10 @@ public:
        copy_fault_probability = copy_fault_probability_;
    }
    void setMoveFaultProbability(double move_fault_probability_)
    {
        move_fault_probability = move_fault_probability_;
    }
 protected:
@ -73,59 +79,102 @@ protected:
    }
    zkutil::EphemeralNodeHolder::Ptr createTaskWorkerNodeAndWaitIfNeed(
-            const zkutil::ZooKeeperPtr &zookeeper,
+            const zkutil::ZooKeeperPtr & zookeeper,
-            const String &description,
+            const String & description,
            bool unprioritized);
    /*
     * Checks that partition piece or some other entity is clean.
     * The only requirement is that you have to pass is_dirty_flag_path and is_dirty_cleaned_path to the function.
     * And is_dirty_flag_path is a parent of is_dirty_cleaned_path.
     * */
    static bool checkPartitionPieceIsClean(
            const zkutil::ZooKeeperPtr & zookeeper,
            const CleanStateClock & clean_state_clock,
            const String & task_status_path);
    bool checkAllPiecesInPartitionAreDone(const TaskTable & task_table, const String & partition_name, const TasksShard & shards_with_partition);
    /** Checks that the whole partition of a table was copied. We should do it carefully due to dirty lock.
     * State of some task could change during the processing.
     * We have to ensure that all shards have the finished state and there is no dirty flag.
     * Moreover, we have to check status twice and check zxid, because state can change during the checking.
     */
-    bool checkPartitionIsDone(const TaskTable & task_table, const String & partition_name,
+
-                              const TasksShard & shards_with_partition);
+    /* The same as function above
     * Assume that we don't know on which shards do we have partition certain piece.
     * We'll check them all (I mean shards that contain the whole partition)
     * And shards that don't have certain piece MUST mark that piece is_done true.
     * */
    bool checkPartitionPieceIsDone(const TaskTable & task_table, const String & partition_name,
                                   size_t piece_number, const TasksShard & shards_with_partition);
    /*Alter successful insertion to helping tables it will move all pieces to destination table*/
    TaskStatus tryMoveAllPiecesToDestinationTable(const TaskTable & task_table, const String & partition_name);
    /// Removes MATERIALIZED and ALIAS columns from create table query
-    static ASTPtr removeAliasColumnsFromCreateQuery(const ASTPtr &query_ast);
+    static ASTPtr removeAliasColumnsFromCreateQuery(const ASTPtr & query_ast);
    bool tryDropPartition(ShardPartition & task_partition,
                          const zkutil::ZooKeeperPtr & zookeeper,
                          const CleanStateClock & clean_state_clock);
    bool tryDropPartitionPiece(ShardPartition & task_partition, const size_t current_piece_number,
            const zkutil::ZooKeeperPtr & zookeeper, const CleanStateClock & clean_state_clock);
    static constexpr UInt64 max_table_tries = 1000;
    static constexpr UInt64 max_shard_partition_tries = 600;
    static constexpr UInt64 max_shard_partition_piece_tries_for_alter = 100;
    bool tryProcessTable(const ConnectionTimeouts & timeouts, TaskTable & task_table);
-    PartitionTaskStatus tryProcessPartitionTask(const ConnectionTimeouts & timeouts,
+    /// Job for copying partition from particular shard.
-                                                ShardPartition & task_partition,
+    TaskStatus tryProcessPartitionTask(const ConnectionTimeouts & timeouts,
-                                                bool is_unprioritized_task);
+                                       ShardPartition & task_partition,
                                       bool is_unprioritized_task);
-    PartitionTaskStatus processPartitionTaskImpl(const ConnectionTimeouts & timeouts,
+    TaskStatus iterateThroughAllPiecesInPartition(const ConnectionTimeouts & timeouts,
-                                                 ShardPartition & task_partition,
+                                                  ShardPartition & task_partition,
-                                                 bool is_unprioritized_task);
+                                                  bool is_unprioritized_task);
    TaskStatus processPartitionPieceTaskImpl(const ConnectionTimeouts & timeouts,
                                             ShardPartition & task_partition,
                                             const size_t current_piece_number,
                                             bool is_unprioritized_task);
    void dropAndCreateLocalTable(const ASTPtr & create_ast);
-    void dropLocalTableIfExists (const DatabaseAndTableName & table_name) const;
+    void dropLocalTableIfExists(const DatabaseAndTableName & table_name) const;
-    String getRemoteCreateTable(const DatabaseAndTableName & table,
+    void dropHelpingTables(const TaskTable & task_table);
-                                Connection & connection,
+
-                                const Settings * settings = nullptr);
+    /// Is used for usage less disk space.
    /// After all pieces were successfully moved to original destination
    /// table we can get rid of partition pieces (partitions in helping tables).
    void dropParticularPartitionPieceFromAllHelpingTables(const TaskTable & task_table, const String & partition_name);
    String getRemoteCreateTable(const DatabaseAndTableName & table, Connection & connection, const Settings * settings = nullptr);
    ASTPtr getCreateTableForPullShard(const ConnectionTimeouts & timeouts, TaskShard & task_shard);
-    void createShardInternalTables(const ConnectionTimeouts & timeouts,
+    /// If it is implicitly asked to create split Distributed table for certain piece on current shard, we will do it.
-                                   TaskShard & task_shard,
+    void createShardInternalTables(const ConnectionTimeouts & timeouts, TaskShard & task_shard, bool create_split = true);
                                   bool create_split = true);
-    std::set<String> getShardPartitions(const ConnectionTimeouts & timeouts,
+    std::set<String> getShardPartitions(const ConnectionTimeouts & timeouts, TaskShard & task_shard);
                                        TaskShard & task_shard);
-    bool checkShardHasPartition(const ConnectionTimeouts & timeouts,
+    bool checkShardHasPartition(const ConnectionTimeouts & timeouts, TaskShard & task_shard, const String & partition_quoted_name);
-                                TaskShard & task_shard,
+
-                                const String & partition_quoted_name);
+    bool checkPresentPartitionPiecesOnCurrentShard(const ConnectionTimeouts & timeouts,
             TaskShard & task_shard, const String & partition_quoted_name, size_t current_piece_number);
    /*
     * This class is used in executeQueryOnCluster function
     * You can execute query on each shard (no sense it is executed on each replica of a shard or not)
     * or you can execute query on each replica on each shard.
     * First mode is useful for INSERTS queries.
     * */
    enum ClusterExecutionMode
    {
        ON_EACH_SHARD,
        ON_EACH_NODE
    };
    /** Executes simple query (without output streams, for example DDL queries) on each shard of the cluster
      * Returns number of shards for which at least one replica executed query successfully
@ -136,6 +185,7 @@ protected:
            const ASTPtr & query_ast_ = nullptr,
            const Settings * settings = nullptr,
            PoolMode pool_mode = PoolMode::GET_ALL,
            ClusterExecutionMode execution_mode = ClusterExecutionMode::ON_EACH_SHARD,
            UInt64 max_successful_executions_per_shard = 0) const;
 private:
@ -145,25 +195,25 @@ private:
    String working_database_name;
    /// Auto update config stuff
-    UInt64 task_descprtion_current_version = 1;
+    UInt64 task_description_current_version = 1;
-    std::atomic<UInt64> task_descprtion_version{1};
+    std::atomic<UInt64> task_description_version{1};
    Coordination::WatchCallback task_description_watch_callback;
    /// ZooKeeper session used to set the callback
    zkutil::ZooKeeperPtr task_description_watch_zookeeper;
    ConfigurationPtr task_cluster_initial_config;
    ConfigurationPtr task_cluster_current_config;
-    Coordination::Stat task_descprtion_current_stat{};
+    Coordination::Stat task_description_current_stat{};
    std::unique_ptr<TaskCluster> task_cluster;
    bool is_safe_mode = false;
    double copy_fault_probability = 0.0;
    double move_fault_probability = 0.0;
    Context & context;
    Poco::Logger * log;
    std::chrono::milliseconds default_sleep_time{1000};
 };
 }
--- a/dbms/programs/copier/ClusterCopierApp.cpp
+++ b/dbms/programs/copier/ClusterCopierApp.cpp
@ -17,6 +17,8 @@ void ClusterCopierApp::initialize(Poco::Util::Application & self)
    is_safe_mode = config().has("safe-mode");
    if (config().has("copy-fault-probability"))
        copy_fault_probability = std::max(std::min(config().getDouble("copy-fault-probability"), 1.0), 0.0);
    if (config().has("move-fault-probability"))
        move_fault_probability = std::max(std::min(config().getDouble("move-fault-probability"), 1.0), 0.0);
    base_dir = (config().has("base-dir")) ? config().getString("base-dir") : Poco::Path::current();
    // process_id is '<hostname>#<start_timestamp>_<pid>'
    time_t timestamp = Poco::Timestamp().epochTime();
@ -58,23 +60,25 @@ void ClusterCopierApp::defineOptions(Poco::Util::OptionSet & options)
    Base::defineOptions(options);
    options.addOption(Poco::Util::Option("task-path", "", "path to task in ZooKeeper")
-                              .argument("task-path").binding("task-path"));
+                          .argument("task-path").binding("task-path"));
    options.addOption(Poco::Util::Option("task-file", "", "path to task file for uploading in ZooKeeper to task-path")
-                              .argument("task-file").binding("task-file"));
+                          .argument("task-file").binding("task-file"));
    options.addOption(Poco::Util::Option("task-upload-force", "", "Force upload task-file even node already exists")
-                              .argument("task-upload-force").binding("task-upload-force"));
+                          .argument("task-upload-force").binding("task-upload-force"));
    options.addOption(Poco::Util::Option("safe-mode", "", "disables ALTER DROP PARTITION in case of errors")
-                              .binding("safe-mode"));
+                          .binding("safe-mode"));
    options.addOption(Poco::Util::Option("copy-fault-probability", "", "the copying fails with specified probability (used to test partition state recovering)")
-                              .argument("copy-fault-probability").binding("copy-fault-probability"));
+                          .argument("copy-fault-probability").binding("copy-fault-probability"));
    options.addOption(Poco::Util::Option("move-fault-probability", "", "the moving fails with specified probability (used to test partition state recovering)")
                              .argument("move-fault-probability").binding("move-fault-probability"));
    options.addOption(Poco::Util::Option("log-level", "", "sets log level")
-                              .argument("log-level").binding("log-level"));
+                          .argument("log-level").binding("log-level"));
    options.addOption(Poco::Util::Option("base-dir", "", "base directory for copiers, consecutive copier launches will populate /base-dir/launch_id/* directories")
-                              .argument("base-dir").binding("base-dir"));
+                          .argument("base-dir").binding("base-dir"));
    using Me = std::decay_t<decltype(*this)>;
    options.addOption(Poco::Util::Option("help", "", "produce this help message").binding("help")
-                              .callback(Poco::Util::OptionCallback<Me>(this, &Me::handleHelp)));
+                          .callback(Poco::Util::OptionCallback<Me>(this, &Me::handleHelp)));
 }
@ -85,10 +89,10 @@ void ClusterCopierApp::mainImpl()
    auto log = &logger();
    LOG_INFO(log, "Starting clickhouse-copier ("
-            << "id " << process_id << ", "
+        << "id " << process_id << ", "
-            << "host_id " << host_id << ", "
+        << "host_id " << host_id << ", "
-            << "path " << process_path << ", "
+        << "path " << process_path << ", "
-            << "revision " << ClickHouseRevision::get() << ")");
+        << "revision " << ClickHouseRevision::get() << ")");
    auto context = std::make_unique<Context>(Context::createGlobal());
    context->makeGlobalContext();
@ -115,6 +119,7 @@ void ClusterCopierApp::mainImpl()
    auto copier = std::make_unique<ClusterCopier>(task_path, host_id, default_database, *context);
    copier->setSafeMode(is_safe_mode);
    copier->setCopyFaultProbability(copy_fault_probability);
    copier->setMoveFaultProbability(move_fault_probability);
    auto task_file = config().getString("task-file", "");
    if (!task_file.empty())
--- a/dbms/programs/copier/ClusterCopierApp.h
+++ b/dbms/programs/copier/ClusterCopierApp.h
@ -78,7 +78,8 @@ private:
    std::string task_path;
    std::string log_level = "trace";
    bool is_safe_mode = false;
-    double copy_fault_probability = 0;
+    double copy_fault_probability = 0.0;
    double move_fault_probability = 0.0;
    bool is_help = false;
    std::string base_dir;
--- a/dbms/programs/copier/Internals.cpp
+++ b/dbms/programs/copier/Internals.cpp
@ -1,4 +1,5 @@
 #include "Internals.h"
 #include <Storages/MergeTree/MergeTreeData.h>
 namespace DB
 {
@ -7,6 +8,8 @@ namespace ErrorCodes
    extern const int BAD_ARGUMENTS;
 }
 using ConfigurationPtr = Poco::AutoPtr<Poco::Util::AbstractConfiguration>;
 ConfigurationPtr getConfigurationFromXMLString(const std::string & xml_data)
 {
    std::stringstream ss(xml_data);
@ -14,7 +17,6 @@ ConfigurationPtr getConfigurationFromXMLString(const std::string & xml_data)
    return {new Poco::Util::XMLConfiguration{&input_source}};
 }
 String getQuotedTable(const String & database, const String & table)
 {
    if (database.empty())
@ -114,6 +116,142 @@ ASTPtr extractPartitionKey(const ASTPtr & storage_ast)
    }
 }
 ASTPtr extractPrimaryKey(const ASTPtr & storage_ast)
 {
    String storage_str = queryToString(storage_ast);
    const auto & storage = storage_ast->as<ASTStorage &>();
    const auto & engine = storage.engine->as<ASTFunction &>();
    if (!endsWith(engine.name, "MergeTree"))
    {
        throw Exception("Unsupported engine was specified in " + storage_str + ", only *MergeTree engines are supported",
                        ErrorCodes::BAD_ARGUMENTS);
    }
    if (!isExtendedDefinitionStorage(storage_ast))
    {
        throw Exception("Is not extended deginition storage " + storage_str + " Will be fixed later.",
                        ErrorCodes::BAD_ARGUMENTS);
    }
    if (storage.primary_key)
        return storage.primary_key->clone();
    return nullptr;
 }
 ASTPtr extractOrderBy(const ASTPtr & storage_ast)
 {
    String storage_str = queryToString(storage_ast);
    const auto & storage = storage_ast->as<ASTStorage &>();
    const auto & engine = storage.engine->as<ASTFunction &>();
    if (!endsWith(engine.name, "MergeTree"))
    {
        throw Exception("Unsupported engine was specified in " + storage_str + ", only *MergeTree engines are supported",
                        ErrorCodes::BAD_ARGUMENTS);
    }
    if (!isExtendedDefinitionStorage(storage_ast))
    {
        throw Exception("Is not extended deginition storage " + storage_str + " Will be fixed later.",
                        ErrorCodes::BAD_ARGUMENTS);
    }
    if (storage.order_by)
        return storage.order_by->clone();
    throw Exception("ORDER BY cannot be empty", ErrorCodes::BAD_ARGUMENTS);
 }
 String createCommaSeparatedStringFrom(const Names & names)
 {
    std::ostringstream ss;
    if (!names.empty())
    {
        std::copy(names.begin(), std::prev(names.end()), std::ostream_iterator<std::string>(ss, ", "));
        ss << names.back();
    }
    return ss.str();
 }
 Names extractPrimaryKeyColumnNames(const ASTPtr & storage_ast)
 {
    const auto sorting_key_ast = extractOrderBy(storage_ast);
    const auto primary_key_ast = extractPrimaryKey(storage_ast);
    const auto sorting_key_expr_list = MergeTreeData::extractKeyExpressionList(sorting_key_ast);
    const auto primary_key_expr_list = primary_key_ast
                           ? MergeTreeData::extractKeyExpressionList(primary_key_ast) : sorting_key_expr_list->clone();
    /// Maybe we have to handle VersionedCollapsing engine separately. But in our case in looks pointless.
    size_t primary_key_size = primary_key_expr_list->children.size();
    size_t sorting_key_size = sorting_key_expr_list->children.size();
    if (primary_key_size > sorting_key_size)
        throw Exception("Primary key must be a prefix of the sorting key, but its length: "
                        + toString(primary_key_size) + " is greater than the sorting key length: " + toString(sorting_key_size),
                        ErrorCodes::BAD_ARGUMENTS);
    Names primary_key_columns;
    Names sorting_key_columns;
    NameSet primary_key_columns_set;
    for (size_t i = 0; i < sorting_key_size; ++i)
    {
        String sorting_key_column = sorting_key_expr_list->children[i]->getColumnName();
        sorting_key_columns.push_back(sorting_key_column);
        if (i < primary_key_size)
        {
            String pk_column = primary_key_expr_list->children[i]->getColumnName();
            if (pk_column != sorting_key_column)
                throw Exception("Primary key must be a prefix of the sorting key, but in position "
                                + toString(i) + " its column is " + pk_column + ", not " + sorting_key_column,
                                ErrorCodes::BAD_ARGUMENTS);
            if (!primary_key_columns_set.emplace(pk_column).second)
                throw Exception("Primary key contains duplicate columns", ErrorCodes::BAD_ARGUMENTS);
            primary_key_columns.push_back(pk_column);
        }
    }
    return primary_key_columns;
 }
 String extractReplicatedTableZookeeperPath(const ASTPtr & storage_ast)
 {
    String storage_str = queryToString(storage_ast);
    const auto & storage = storage_ast->as<ASTStorage &>();
    const auto & engine = storage.engine->as<ASTFunction &>();
    if (!endsWith(engine.name, "MergeTree"))
    {
        throw Exception(
                "Unsupported engine was specified in " + storage_str + ", only *MergeTree engines are supported",
                ErrorCodes::BAD_ARGUMENTS);
    }
    if (!startsWith(engine.name, "Replicated"))
    {
        return "";
    }
    auto replicated_table_arguments = engine.arguments->children;
    auto zk_table_path_ast = replicated_table_arguments[0]->as<ASTLiteral &>();
    auto zk_table_path_string = zk_table_path_ast.value.safeGet<String>();
    return zk_table_path_string;
 }
 ShardPriority getReplicasPriority(const Cluster::Addresses & replicas, const std::string & local_hostname, UInt8 random)
 {
    ShardPriority res;
--- a/dbms/programs/copier/Internals.h
+++ b/dbms/programs/copier/Internals.h
@ -31,6 +31,7 @@
 #include <Common/ThreadStatus.h>
 #include <Client/Connection.h>
 #include <Interpreters/Context.h>
 #include <Interpreters/Cluster.h>
 #include <Interpreters/InterpreterFactory.h>
 #include <Interpreters/InterpreterExistsQuery.h>
 #include <Interpreters/InterpreterShowCreateQuery.h>
@ -144,15 +145,15 @@ struct ShardPriority
    }
 };
-/// Execution status of a task
+/// Execution status of a task.
-enum class PartitionTaskStatus
+/// Is used for: partition copying task status, partition piece copying task status, partition moving task status.
 enum class TaskStatus
 {
    Active,
    Finished,
    Error,
 };
 struct MultiTransactionInfo
 {
    int32_t code;
@ -174,6 +175,35 @@ bool isExtendedDefinitionStorage(const ASTPtr & storage_ast);
 ASTPtr extractPartitionKey(const ASTPtr & storage_ast);
 /*
 * Choosing a Primary Key that Differs from the Sorting Key
 * It is possible to specify a primary key (an expression with values that are written in the index file for each mark)
 * that is different from the sorting key (an expression for sorting the rows in data parts).
 * In this case the primary key expression tuple must be a prefix of the sorting key expression tuple.
 * This feature is helpful when using the SummingMergeTree and AggregatingMergeTree table engines.
 * In a common case when using these engines, the table has two types of columns: dimensions and measures.
 * Typical queries aggregate values of measure columns with arbitrary GROUP BY and filtering by dimensions.
 * Because SummingMergeTree and AggregatingMergeTree aggregate rows with the same value of the sorting key,
 * it is natural to add all dimensions to it. As a result, the key expression consists of a long list of columns
 * and this list must be frequently updated with newly added dimensions.
 * In this case it makes sense to leave only a few columns in the primary key that will provide efficient
 * range scans and add the remaining dimension columns to the sorting key tuple.
 * ALTER of the sorting key is a lightweight operation because when a new column is simultaneously added t
 * o the table and to the sorting key, existing data parts don't need to be changed.
 * Since the old sorting key is a prefix of the new sorting key and there is no data in the newly added column,
 * the data is sorted by both the old and new sorting keys at the moment of table modification.
 *
 * */
 ASTPtr extractPrimaryKey(const ASTPtr & storage_ast);
 ASTPtr extractOrderBy(const ASTPtr & storage_ast);
 String createCommaSeparatedStringFrom(const Names & names);
 Names extractPrimaryKeyColumnNames(const ASTPtr & storage_ast);
 String extractReplicatedTableZookeeperPath(const ASTPtr & storage_ast);
 ShardPriority getReplicasPriority(const Cluster::Addresses & replicas, const std::string & local_hostname, UInt8 random);
 }
--- a/dbms/programs/copier/ShardPartition.h
+++ b/dbms/programs/copier/ShardPartition.h
@ -1,24 +1,46 @@
 #pragma once
 #include "Aliases.h"
 #include "TaskTableAndShard.h"
 namespace DB
 {
 /// Just destination partition of a shard
 /// I don't know what this comment means.
 /// In short, when we discovered what shards contain currently processing partition,
 /// This class describes a partition (name) that is stored on the shard (parent).
 struct ShardPartition
 {
-    ShardPartition(TaskShard & parent, const String & name_quoted_) : task_shard(parent), name(name_quoted_) {}
+    ShardPartition(TaskShard &parent, String name_quoted_, size_t number_of_splits = 10)
            : task_shard(parent), name(std::move(name_quoted_)) { pieces.reserve(number_of_splits); }
    String getPartitionPath() const;
    String getPartitionPiecePath(size_t current_piece_number) const;
    String getPartitionCleanStartPath() const;
    String getPartitionPieceCleanStartPath(size_t current_piece_number) const;
    String getCommonPartitionIsDirtyPath() const;
    String getCommonPartitionIsCleanedPath() const;
    String getPartitionActiveWorkersPath() const;
    String getActiveWorkerPath() const;
    String getPartitionShardsPath() const;
    String getShardStatusPath() const;
    /// What partition pieces are present in current shard.
    /// FYI: Piece is a part of partition which has modulo equals to concrete constant (less than number_of_splits obliously)
    /// For example SELECT ... from ... WHERE partition=current_partition AND cityHash64(*) == const;
    /// Absent pieces have field is_absent_piece equals to true.
    PartitionPieces pieces;
    TaskShard & task_shard;
    String name;
 };
@ -28,11 +50,23 @@ inline String ShardPartition::getPartitionCleanStartPath() const
    return getPartitionPath() + "/clean_start";
 }
 inline String ShardPartition::getPartitionPieceCleanStartPath(size_t current_piece_number) const
 {
    assert(current_piece_number < task_shard.task_table.number_of_splits);
    return getPartitionPiecePath(current_piece_number) + "/clean_start";
 }
 inline String ShardPartition::getPartitionPath() const
 {
    return task_shard.task_table.getPartitionPath(name);
 }
 inline String ShardPartition::getPartitionPiecePath(size_t current_piece_number) const
 {
    assert(current_piece_number < task_shard.task_table.number_of_splits);
    return task_shard.task_table.getPartitionPiecePath(name, current_piece_number);
 }
 inline String ShardPartition::getShardStatusPath() const
 {
    // schema: /<root...>/tables/<table>/<partition>/shards/<shard>
--- a/dbms/programs/copier/ShardPartitionPiece.h
+++ b/dbms/programs/copier/ShardPartitionPiece.h
@ -0,0 +1,88 @@
 #pragma once
 #include "Internals.h"
 namespace DB
 {
 struct ShardPartitionPiece
 {
    ShardPartitionPiece(ShardPartition &parent, size_t current_piece_number_, bool is_present_piece_)
            : is_absent_piece(!is_present_piece_), current_piece_number(current_piece_number_),
              shard_partition(parent) {}
    String getPartitionPiecePath() const;
    String getPartitionPieceCleanStartPath() const;
    String getPartitionPieceIsDirtyPath() const;
    String getPartitionPieceIsCleanedPath() const;
    String getPartitionPieceActiveWorkersPath() const;
    String getActiveWorkerPath() const ;
    /// On what shards do we have current partition.
    String getPartitionPieceShardsPath() const;
    String getShardStatusPath() const;
    String getPartitionPieceCleanerPath() const;
    bool is_absent_piece;
    const size_t current_piece_number;
    ShardPartition & shard_partition;
 };
 inline String ShardPartitionPiece::getPartitionPiecePath() const
 {
    return shard_partition.getPartitionPath() + "/piece_" + toString(current_piece_number);
 }
 inline String ShardPartitionPiece::getPartitionPieceCleanStartPath() const
 {
    return getPartitionPiecePath() + "/clean_start";
 }
 inline String ShardPartitionPiece::getPartitionPieceIsDirtyPath() const
 {
    return getPartitionPiecePath() + "/is_dirty";
 }
 inline String ShardPartitionPiece::getPartitionPieceIsCleanedPath() const
 {
    return getPartitionPieceIsDirtyPath() + "/cleaned";
 }
 inline String ShardPartitionPiece::getPartitionPieceActiveWorkersPath() const
 {
    return getPartitionPiecePath() + "/partition_piece_active_workers";
 }
 inline String ShardPartitionPiece::getActiveWorkerPath() const
 {
    return getPartitionPieceActiveWorkersPath() + "/" + toString(shard_partition.task_shard.numberInCluster());
 }
 /// On what shards do we have current partition.
 inline String ShardPartitionPiece::getPartitionPieceShardsPath() const
 {
    return getPartitionPiecePath() + "/shards";
 }
 inline String ShardPartitionPiece::getShardStatusPath() const
 {
    return getPartitionPieceShardsPath() + "/" + toString(shard_partition.task_shard.numberInCluster());
 }
 inline String ShardPartitionPiece::getPartitionPieceCleanerPath() const
 {
    return getPartitionPieceIsDirtyPath() + "/cleaner";
 }
 }
--- a/dbms/programs/copier/TaskTableAndShard.h
+++ b/dbms/programs/copier/TaskTableAndShard.h
@ -21,16 +21,44 @@ struct TaskTable
    TaskCluster & task_cluster;
    /// These functions used in checkPartitionIsDone() or checkPartitionPieceIsDone()
    /// They are implemented here not to call task_table.tasks_shard[partition_name].second.pieces[current_piece_number] etc.
    String getPartitionPath(const String & partition_name) const;
-    String getPartitionIsDirtyPath(const String & partition_name) const;
+
-    String getPartitionIsCleanedPath(const String & partition_name) const;
+    String getPartitionAttachIsActivePath(const String & partition_name) const;
-    String getPartitionTaskStatusPath(const String & partition_name) const;
+
    String getPartitionAttachIsDonePath(const String & partition_name) const;
    String getPartitionPiecePath(const String & partition_name, const size_t piece_number) const;
    String getCertainPartitionIsDirtyPath(const String & partition_name) const;
    String getCertainPartitionPieceIsDirtyPath(const String & partition_name, const size_t piece_number) const;
    String getCertainPartitionIsCleanedPath(const String & partition_name) const;
    String getCertainPartitionPieceIsCleanedPath(const String & partition_name, const size_t piece_number) const;
    String getCertainPartitionTaskStatusPath(const String & partition_name) const;
    String getCertainPartitionPieceTaskStatusPath(const String & partition_name, const size_t piece_number) const;
    bool isReplicatedTable() const { return engine_push_zk_path != ""; }
    /// Partitions will be splitted into number-of-splits pieces.
    /// Each piece will be copied independently. (10 by default)
    size_t number_of_splits;
    String name_in_config;
    /// Used as task ID
    String table_id;
    /// Column names in primary key
    String primary_key_comma_separated;
    /// Source cluster and table
    String cluster_pull_name;
    DatabaseAndTableName table_pull;
@ -40,14 +68,31 @@ struct TaskTable
    DatabaseAndTableName table_push;
    /// Storage of destination table
    /// (tables that are stored on each shard of target cluster)
    String engine_push_str;
    ASTPtr engine_push_ast;
    ASTPtr engine_push_partition_key_ast;
-    /// A Distributed table definition used to split data
+    /// First argument of Replicated...MergeTree()
    String engine_push_zk_path;
    ASTPtr rewriteReplicatedCreateQueryToPlain();
    /*
     * A Distributed table definition used to split data
     * Distributed table will be created on each shard of default
     * cluster to perform data copying and resharding
     * */
    String sharding_key_str;
    ASTPtr sharding_key_ast;
-    ASTPtr engine_split_ast;
+    ASTPtr main_engine_split_ast;
    /*
     * To copy partiton piece form one cluster to another we have to use Distributed table.
     * In case of usage separate table (engine_push) for each partiton piece,
     * we have to use many Distributed tables.
     * */
    ASTs auxiliary_engine_split_asts;
    /// Additional WHERE expression to filter input data
    String where_condition_str;
@ -62,10 +107,15 @@ struct TaskTable
    Strings enabled_partitions;
    NameSet enabled_partitions_set;
-    /// Prioritized list of shards
+    /**
     * Prioritized list of shards
     * all_shards contains information about all shards in the table.
     * So we have to check whether particular shard have current partiton or not while processing.
     */
    TasksShard all_shards;
    TasksShard local_shards;
    /// All partitions of the current table.
    ClusterPartitions cluster_partitions;
    NameSet finished_cluster_partitions;
@ -76,7 +126,8 @@ struct TaskTable
    {
        auto it = cluster_partitions.find(partition_name);
        if (it == cluster_partitions.end())
-            throw Exception("There are no cluster partition " + partition_name + " in " + table_id, ErrorCodes::LOGICAL_ERROR);
+            throw Exception("There are no cluster partition " + partition_name + " in " + table_id,
                            ErrorCodes::LOGICAL_ERROR);
        return it->second;
    }
@ -85,13 +136,16 @@ struct TaskTable
    UInt64 rows_copied = 0;
    template <typename RandomEngine>
-    void initShards(RandomEngine && random_engine);
+    void initShards(RandomEngine &&random_engine);
 };
 struct TaskShard
 {
-    TaskShard(TaskTable &parent, const ShardInfo &info_) : task_table(parent), info(info_) {}
+    TaskShard(TaskTable & parent, const ShardInfo & info_) : task_table(parent), info(info_)
    {
        list_of_split_tables_on_shard.assign(task_table.number_of_splits, DatabaseAndTableName());
    }
    TaskTable & task_table;
@ -123,7 +177,8 @@ struct TaskShard
    /// Internal distributed tables
    DatabaseAndTableName table_read_shard;
-    DatabaseAndTableName table_split_shard;
+    DatabaseAndTableName main_table_split_shard;
    ListOfDatabasesAndTableNames list_of_split_tables_on_shard;
 };
@ -134,29 +189,62 @@ inline String TaskTable::getPartitionPath(const String & partition_name) const
           + "/" + escapeForFileName(partition_name);   // 201701
 }
-inline String TaskTable::getPartitionIsDirtyPath(const String & partition_name) const
+inline String TaskTable::getPartitionAttachIsActivePath(const String & partition_name) const
 {
    return getPartitionPath(partition_name) + "/attach_active";
 }
 inline String TaskTable::getPartitionAttachIsDonePath(const String & partition_name) const
 {
    return getPartitionPath(partition_name) + "/attach_is_done";
 }
 inline String TaskTable::getPartitionPiecePath(const String & partition_name, size_t piece_number) const
 {
    assert(piece_number < number_of_splits);
    return getPartitionPath(partition_name) + "/piece_" + toString(piece_number);  // 1...number_of_splits
 }
 inline String TaskTable::getCertainPartitionIsDirtyPath(const String &partition_name) const
 {
    return getPartitionPath(partition_name) + "/is_dirty";
 }
-inline String TaskTable::getPartitionIsCleanedPath(const String & partition_name) const
+inline String TaskTable::getCertainPartitionPieceIsDirtyPath(const String & partition_name, const size_t piece_number) const
 {
-    return getPartitionIsDirtyPath(partition_name) + "/cleaned";
+    return getPartitionPiecePath(partition_name, piece_number) + "/is_dirty";
 }
-inline String TaskTable::getPartitionTaskStatusPath(const String & partition_name) const
+inline String TaskTable::getCertainPartitionIsCleanedPath(const String & partition_name) const
 {
    return getCertainPartitionIsDirtyPath(partition_name) + "/cleaned";
 }
 inline String TaskTable::getCertainPartitionPieceIsCleanedPath(const String & partition_name, const size_t piece_number) const
 {
    return getCertainPartitionPieceIsDirtyPath(partition_name, piece_number) + "/cleaned";
 }
 inline String TaskTable::getCertainPartitionTaskStatusPath(const String & partition_name) const
 {
    return getPartitionPath(partition_name) + "/shards";
 }
-inline TaskTable::TaskTable(TaskCluster & parent, const Poco::Util::AbstractConfiguration & config, const String & prefix_,
+inline String TaskTable::getCertainPartitionPieceTaskStatusPath(const String & partition_name, const size_t piece_number) const
-                     const String & table_key)
+{
    return getPartitionPiecePath(partition_name, piece_number) + "/shards";
 }
 inline TaskTable::TaskTable(TaskCluster & parent, const Poco::Util::AbstractConfiguration & config,
                     const String & prefix_, const String & table_key)
        : task_cluster(parent)
 {
    String table_prefix = prefix_ + "." + table_key + ".";
    name_in_config = table_key;
    number_of_splits = config.getUInt64(table_prefix + "number_of_splits", 10);
    cluster_pull_name = config.getString(table_prefix + "cluster_pull");
    cluster_push_name = config.getString(table_prefix + "cluster_push");
@ -176,13 +264,27 @@ inline TaskTable::TaskTable(TaskCluster & parent, const Poco::Util::AbstractConf
        ParserStorage parser_storage;
        engine_push_ast = parseQuery(parser_storage, engine_push_str, 0);
        engine_push_partition_key_ast = extractPartitionKey(engine_push_ast);
        primary_key_comma_separated = createCommaSeparatedStringFrom(extractPrimaryKeyColumnNames(engine_push_ast));
        engine_push_zk_path = extractReplicatedTableZookeeperPath(engine_push_ast);
    }
    sharding_key_str = config.getString(table_prefix + "sharding_key");
    auxiliary_engine_split_asts.reserve(number_of_splits);
    {
        ParserExpressionWithOptionalAlias parser_expression(false);
        sharding_key_ast = parseQuery(parser_expression, sharding_key_str, 0);
-        engine_split_ast = createASTStorageDistributed(cluster_push_name, table_push.first, table_push.second, sharding_key_ast);
+        main_engine_split_ast = createASTStorageDistributed(cluster_push_name, table_push.first, table_push.second,
                                                            sharding_key_ast);
        for (const auto piece_number : ext::range(0, number_of_splits))
        {
            auxiliary_engine_split_asts.emplace_back
                    (
                            createASTStorageDistributed(cluster_push_name, table_push.first,
                                                        table_push.second + "_piece_" + toString(piece_number), sharding_key_ast)
                    );
        }
    }
    where_condition_str = config.getString(table_prefix + "where_condition", "");
@ -213,7 +315,7 @@ inline TaskTable::TaskTable(TaskCluster & parent, const Poco::Util::AbstractConf
        else
        {
            /// Parse sequence of <partition>...</partition>
-            for (const String & key : keys)
+            for (const String &key : keys)
            {
                if (!startsWith(key, "partition"))
                    throw Exception("Unknown key " + key + " in " + enabled_partitions_prefix, ErrorCodes::UNKNOWN_ELEMENT_IN_CONFIG);
@ -259,6 +361,25 @@ inline void TaskTable::initShards(RandomEngine && random_engine)
    local_shards.assign(all_shards.begin(), it_first_remote);
 }
 inline ASTPtr TaskTable::rewriteReplicatedCreateQueryToPlain()
 {
    ASTPtr prev_engine_push_ast = engine_push_ast->clone();
    auto & new_storage_ast = prev_engine_push_ast->as<ASTStorage &>();
    auto & new_engine_ast = new_storage_ast.engine->as<ASTFunction &>();
    auto & replicated_table_arguments = new_engine_ast.arguments->children;
    /// Delete first two arguments of Replicated...MergeTree() table.
    replicated_table_arguments.erase(replicated_table_arguments.begin());
    replicated_table_arguments.erase(replicated_table_arguments.begin());
    /// Remove replicated from name
    new_engine_ast.name = new_engine_ast.name.substr(10);
    return new_storage_ast.clone();
 }
 inline String DB::TaskShard::getDescription() const
 {
@ -272,7 +393,7 @@ inline String DB::TaskShard::getDescription() const
 inline String DB::TaskShard::getHostNameExample() const
 {
-    auto &replicas = task_table.cluster_pull->getShardsAddresses().at(indexInCluster());
+    auto & replicas = task_table.cluster_pull->getShardsAddresses().at(indexInCluster());
    return replicas.at(0).readableString();
 }
--- a/dbms/programs/copier/ZooKeeperStaff.h
+++ b/dbms/programs/copier/ZooKeeperStaff.h
@ -157,11 +157,8 @@ public:
    bool is_clean() const
    {
-        return
+        return !is_stale()
-                !is_stale()
+            && (!discovery_zxid.hasHappened() || (clean_state_zxid.hasHappened() && discovery_zxid <= clean_state_zxid));
                && (
                        !discovery_zxid.hasHappened()
                        || (clean_state_zxid.hasHappened() && discovery_zxid <= clean_state_zxid));
    }
    bool is_stale() const
--- a/dbms/programs/local/LocalServer.cpp
+++ b/dbms/programs/local/LocalServer.cpp
@ -148,7 +148,6 @@ try
        return Application::EXIT_OK;
    }
    context = std::make_unique<Context>(Context::createGlobal());
    context->makeGlobalContext();
    context->setApplicationType(Context::ApplicationType::LOCAL);
@ -180,7 +179,7 @@ try
    setupUsers();
    /// Limit on total number of concurrently executing queries.
-    /// There is no need for concurrent threads, override max_concurrent_queries.
+    /// There is no need for concurrent queries, override max_concurrent_queries.
    context->getProcessList().setMaxSize(0);
    /// Size of cache for uncompressed blocks. Zero means disabled.
--- a/dbms/programs/main.cpp
+++ b/dbms/programs/main.cpp
@ -1,3 +1,7 @@
 #include <signal.h>
 #include <setjmp.h>
 #include <unistd.h>
 #include <new>
 #include <iostream>
 #include <vector>
@ -118,6 +122,159 @@ bool isClickhouseApp(const std::string & app_suffix, std::vector<char *> & argv)
    return !argv.empty() && (app_name == argv[0] || endsWith(argv[0], "/" + app_name));
 }
 enum class InstructionFail
 {
    NONE = 0,
    SSE3 = 1,
    SSSE3 = 2,
    SSE4_1 = 3,
    SSE4_2 = 4,
    AVX = 5,
    AVX2 = 6,
    AVX512 = 7
 };
 const char * instructionFailToString(InstructionFail fail)
 {
    switch (fail)
    {
        case InstructionFail::NONE:
            return "NONE";
        case InstructionFail::SSE3:
            return "SSE3";
        case InstructionFail::SSSE3:
            return "SSSE3";
        case InstructionFail::SSE4_1:
            return "SSE4.1";
        case InstructionFail::SSE4_2:
            return "SSE4.2";
        case InstructionFail::AVX:
            return "AVX";
        case InstructionFail::AVX2:
            return "AVX2";
        case InstructionFail::AVX512:
            return "AVX512";
    }
    __builtin_unreachable();
 }
 sigjmp_buf jmpbuf;
 [[noreturn]] void sigIllCheckHandler(int, siginfo_t *, void *)
 {
    siglongjmp(jmpbuf, 1);
 }
 /// Check if necessary SSE extensions are available by trying to execute some sse instructions.
 /// If instruction is unavailable, SIGILL will be sent by kernel.
 void checkRequiredInstructionsImpl(volatile InstructionFail & fail)
 {
 #if defined(__SSE3__)
    fail = InstructionFail::SSE3;
    __asm__ volatile ("addsubpd %%xmm0, %%xmm0" : : : "xmm0");
 #endif
 #if defined(__SSSE3__)
    fail = InstructionFail::SSSE3;
    __asm__ volatile ("pabsw %%xmm0, %%xmm0" : : : "xmm0");
 #endif
 #if defined(__SSE4_1__)
    fail = InstructionFail::SSE4_1;
    __asm__ volatile ("pmaxud %%xmm0, %%xmm0" : : : "xmm0");
 #endif
 #if defined(__SSE4_2__)
    fail = InstructionFail::SSE4_2;
    __asm__ volatile ("pcmpgtq %%xmm0, %%xmm0" : : : "xmm0");
 #endif
 #if defined(__AVX__)
    fail = InstructionFail::AVX;
    __asm__ volatile ("vaddpd %%ymm0, %%ymm0, %%ymm0" : : : "ymm0");
 #endif
 #if defined(__AVX2__)
    fail = InstructionFail::AVX2;
    __asm__ volatile ("vpabsw %%ymm0, %%ymm0" : : : "ymm0");
 #endif
 #if defined(__AVX512__)
    fail = InstructionFail::AVX512;
    __asm__ volatile ("vpabsw %%zmm0, %%zmm0" : : : "zmm0");
 #endif
    fail = InstructionFail::NONE;
 }
 /// This function is safe to use in static initializers.
 void writeError(const char * data, size_t size)
 {
    while (size != 0)
    {
        ssize_t res = ::write(STDERR_FILENO, data, size);
        if ((-1 == res || 0 == res) && errno != EINTR)
            _Exit(1);
        if (res > 0)
        {
            data += res;
            size -= res;
        }
    }
 }
 /// Check SSE and others instructions availability. Calls exit on fail.
 /// This function must be called as early as possible, even before main, because static initializers may use unavailable instructions.
 void checkRequiredInstructions()
 {
    struct sigaction sa{};
    struct sigaction sa_old{};
    sa.sa_sigaction = sigIllCheckHandler;
    sa.sa_flags = SA_SIGINFO;
    auto signal = SIGILL;
    if (sigemptyset(&sa.sa_mask) != 0
        || sigaddset(&sa.sa_mask, signal) != 0
        || sigaction(signal, &sa, &sa_old) != 0)
    {
        /// You may wonder about strlen.
        /// Typical implementation of strlen is using SSE4.2 or AVX2.
        /// But this is not the case because it's compiler builtin and is executed at compile time.
        const char * msg = "Can not set signal handler\n";
        writeError(msg, strlen(msg));
        _Exit(1);
    }
    volatile InstructionFail fail = InstructionFail::NONE;
    if (sigsetjmp(jmpbuf, 1))
    {
        const char * msg1 = "Instruction check fail. The CPU does not support ";
        writeError(msg1, strlen(msg1));
        const char * msg2 = instructionFailToString(fail);
        writeError(msg2, strlen(msg2));
        const char * msg3 = " instruction set.\n";
        writeError(msg3, strlen(msg3));
        _Exit(1);
    }
    checkRequiredInstructionsImpl(fail);
    if (sigaction(signal, &sa_old, nullptr))
    {
        const char * msg = "Can not set signal handler\n";
        writeError(msg, strlen(msg));
        _Exit(1);
    }
 }
 struct Checker { Checker() { checkRequiredInstructions(); } } checker;
 }
--- a/dbms/src/Core/Settings.h
+++ b/dbms/src/Core/Settings.h
@ -249,6 +249,10 @@ struct Settings : public SettingsCollection<Settings>
    M(SettingString, format_custom_result_before_delimiter, "", "Prefix before result set (for CustomSeparated format)", 0) \
    M(SettingString, format_custom_result_after_delimiter, "", "Suffix after result set (for CustomSeparated format)", 0) \
    \
    M(SettingString, format_regexp, "", "Regular expression (for Regexp format)", 0) \
    M(SettingString, format_regexp_escaping_rule, "Escaped", "Field escaping rule (for Regexp format)", 0) \
    M(SettingBool, format_regexp_skip_unmatched, false, "Skip lines unmatched by regular expression (for Regexp format", 0) \
    \
    M(SettingBool, insert_allow_materialized_columns, 0, "If setting is enabled, Allow materialized columns in INSERT.", 0) \
    M(SettingSeconds, http_connection_timeout, DEFAULT_HTTP_READ_BUFFER_CONNECTION_TIMEOUT, "HTTP connection timeout.", 0) \
    M(SettingSeconds, http_send_timeout, DEFAULT_HTTP_READ_BUFFER_TIMEOUT, "HTTP send timeout", 0) \
--- a/dbms/src/Core/SettingsCollection.h
+++ b/dbms/src/Core/SettingsCollection.h
@ -352,6 +352,7 @@ private:
        StringRef name;
        StringRef description;
        StringRef type;
        bool is_important;
        IsChangedFunction is_changed;
        GetStringFunction get_string;
@ -398,6 +399,7 @@ public:
        const_reference(const const_reference & src) = default;
        const StringRef & getName() const { return member->name; }
        const StringRef & getDescription() const { return member->description; }
        const StringRef & getType() const { return member->type; }
        bool isChanged() const { return member->is_changed(*collection); }
        Field getValue() const;
        String getValueAsString() const { return member->get_string(*collection); }
--- a/dbms/src/Core/SettingsCollectionImpl.h
+++ b/dbms/src/Core/SettingsCollectionImpl.h
@ -323,7 +323,9 @@ void SettingsCollection<Derived>::deserialize(ReadBuffer & buf, SettingsBinaryFo
 #define IMPLEMENT_SETTINGS_COLLECTION_ADD_MEMBER_INFO_HELPER_(TYPE, NAME, DEFAULT, DESCRIPTION, FLAGS) \
-    add({StringRef(#NAME, strlen(#NAME)), StringRef(DESCRIPTION, strlen(DESCRIPTION)), \
+    add({StringRef(#NAME, strlen(#NAME)), \
         StringRef(DESCRIPTION, strlen(DESCRIPTION)), \
         StringRef(#TYPE, strlen(#TYPE)), \
         FLAGS & IMPORTANT, \
         [](const Derived & d) { return d.NAME.changed; }, \
         &Functions::NAME##_getString, &Functions::NAME##_getField, \
--- a/dbms/src/DataStreams/PushingToViewsBlockOutputStream.cpp
+++ b/dbms/src/DataStreams/PushingToViewsBlockOutputStream.cpp
@ -25,7 +25,7 @@ PushingToViewsBlockOutputStream::PushingToViewsBlockOutputStream(
      * Although now any insertion into the table is done via PushingToViewsBlockOutputStream,
      *  but it's clear that here is not the best place for this functionality.
      */
-    addTableLock(storage->lockStructureForShare(true, context.getInitialQueryId()));
+    addTableLock(storage->lockStructureForShare(context.getInitialQueryId()));
    /// If the "root" table deduplactes blocks, there are no need to make deduplication for children
    /// Moreover, deduplication for AggregatingMergeTree children could produce false positives due to low size of inserting blocks
@ -54,7 +54,7 @@ PushingToViewsBlockOutputStream::PushingToViewsBlockOutputStream(
        if (auto * materialized_view = dynamic_cast<StorageMaterializedView *>(dependent_table.get()))
        {
-            addTableLock(materialized_view->lockStructureForShare(true, context.getInitialQueryId()));
+            addTableLock(materialized_view->lockStructureForShare(context.getInitialQueryId()));
            StoragePtr inner_table = materialized_view->getTargetTable();
            auto inner_table_id = inner_table->getStorageID();
--- a/dbms/src/Databases/DatabaseMySQL.cpp
+++ b/dbms/src/Databases/DatabaseMySQL.cpp
@ -358,7 +358,7 @@ void DatabaseMySQL::cleanOutdatedTables()
                ++iterator;
            else
            {
-                const auto table_lock = (*iterator)->lockAlterIntention(RWLockImpl::NO_QUERY);
+                const auto table_lock = (*iterator)->lockAlterIntention();
                (*iterator)->shutdown();
                (*iterator)->is_dropped = true;
--- a/dbms/src/Formats/FormatFactory.cpp
+++ b/dbms/src/Formats/FormatFactory.cpp
@ -68,6 +68,9 @@ static FormatSettings getInputFormatSetting(const Settings & settings, const Con
    format_settings.custom.row_before_delimiter = settings.format_custom_row_before_delimiter;
    format_settings.custom.row_after_delimiter = settings.format_custom_row_after_delimiter;
    format_settings.custom.row_between_delimiter = settings.format_custom_row_between_delimiter;
    format_settings.regexp.regexp = settings.format_regexp;
    format_settings.regexp.escaping_rule = settings.format_regexp_escaping_rule;
    format_settings.regexp.skip_unmatched = settings.format_regexp_skip_unmatched;
    /// Validate avro_schema_registry_url with RemoteHostFilter when non-empty and in Server context
    if (context.hasGlobalContext() && (context.getGlobalContext().getApplicationType() == Context::ApplicationType::SERVER))
@ -352,10 +355,12 @@ FormatFactory::FormatFactory()
    registerOutputFormatProcessorAvro(*this);
    registerInputFormatProcessorTemplate(*this);
    registerOutputFormatProcessorTemplate(*this);
    registerInputFormatProcessorRegexp(*this);
    registerFileSegmentationEngineTabSeparated(*this);
    registerFileSegmentationEngineCSV(*this);
    registerFileSegmentationEngineJSONEachRow(*this);
    registerFileSegmentationEngineRegexp(*this);
    registerOutputFormatNull(*this);
--- a/dbms/src/Formats/FormatFactory.h
+++ b/dbms/src/Formats/FormatFactory.h
@ -178,6 +178,7 @@ void registerOutputFormatProcessorTemplate(FormatFactory &factory);
 void registerFileSegmentationEngineTabSeparated(FormatFactory & factory);
 void registerFileSegmentationEngineCSV(FormatFactory & factory);
 void registerFileSegmentationEngineJSONEachRow(FormatFactory & factory);
 void registerFileSegmentationEngineRegexp(FormatFactory & factory);
 /// Output only (presentational) formats.
@ -198,5 +199,6 @@ void registerOutputFormatProcessorMySQLWrite(FormatFactory & factory);
 /// Input only formats.
 void registerInputFormatProcessorCapnProto(FormatFactory & factory);
 void registerInputFormatProcessorRegexp(FormatFactory & factory);
 }
--- a/dbms/src/Formats/FormatSettings.h
+++ b/dbms/src/Formats/FormatSettings.h
@ -122,6 +122,15 @@ struct FormatSettings
    Avro avro;
    struct Regexp
    {
        std::string regexp;
        std::string escaping_rule;
        bool skip_unmatched = false;
    };
    Regexp regexp;
 };
 }
--- a/dbms/src/Functions/FunctionJoinGet.cpp
+++ b/dbms/src/Functions/FunctionJoinGet.cpp
@ -65,7 +65,7 @@ FunctionBaseImplPtr JoinGetOverloadResolver::build(const ColumnsWithTypeAndName
    auto join = storage_join->getJoin();
    DataTypes data_types(arguments.size());
-    auto table_lock = storage_join->lockStructureForShare(false, context.getInitialQueryId());
+    auto table_lock = storage_join->lockStructureForShare(context.getInitialQueryId());
    for (size_t i = 0; i < arguments.size(); ++i)
        data_types[i] = arguments[i].type;
--- a/dbms/src/Functions/FunctionsMultiStringPosition.h
+++ b/dbms/src/Functions/FunctionsMultiStringPosition.h
@ -0,0 +1,129 @@
 #pragma once
 #include <Columns/ColumnArray.h>
 #include <Columns/ColumnConst.h>
 #include <Columns/ColumnString.h>
 #include <Columns/ColumnFixedString.h>
 #include <Columns/ColumnVector.h>
 #include <DataTypes/DataTypeArray.h>
 #include <DataTypes/DataTypeString.h>
 #include <DataTypes/DataTypesNumber.h>
 #include <Functions/FunctionHelpers.h>
 #include <Functions/IFunctionImpl.h>
 #include <IO/WriteHelpers.h>
 #include <Interpreters/Context.h>
 #include <common/StringRef.h>
 namespace DB
 {
 /** multiSearchAllPositions(haystack, [pattern_1, pattern_2, ..., pattern_n]) -- find first occurrences (positions) of all the const patterns inside haystack
  * multiSearchAllPositionsUTF8(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchAllPositionsCaseInsensitive(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchAllPositionsCaseInsensitiveUTF8(haystack, [pattern_1, pattern_2, ..., pattern_n])
  *
  * multiSearchFirstPosition(haystack, [pattern_1, pattern_2, ..., pattern_n]) -- returns the first position of the haystack matched by strings or zero if nothing was found
  * multiSearchFirstPositionUTF8(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchFirstPositionCaseInsensitive(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchFirstPositionCaseInsensitiveUTF8(haystack, [pattern_1, pattern_2, ..., pattern_n])
  *
  * multiSearchAny(haystack, [pattern_1, pattern_2, ..., pattern_n]) -- find any of the const patterns inside haystack and return 0 or 1
  * multiSearchAnyUTF8(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchAnyCaseInsensitive(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchAnyCaseInsensitiveUTF8(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchFirstIndex(haystack, [pattern_1, pattern_2, ..., pattern_n]) -- returns the first index of the matched string or zero if nothing was found
  * multiSearchFirstIndexUTF8(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchFirstIndexCaseInsensitive(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchFirstIndexCaseInsensitiveUTF8(haystack, [pattern_1, pattern_2, ..., pattern_n])
  */
 namespace ErrorCodes
 {
    extern const int ILLEGAL_TYPE_OF_ARGUMENT;
    extern const int ILLEGAL_COLUMN;
    extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH;
 }
 template <typename Impl, typename Name>
 class FunctionsMultiStringPosition : public IFunction
 {
 public:
    static constexpr auto name = Name::name;
    static FunctionPtr create(const Context &) { return std::make_shared<FunctionsMultiStringPosition>(); }
    String getName() const override { return name; }
    size_t getNumberOfArguments() const override { return 2; }
    bool useDefaultImplementationForConstants() const override { return true; }
    ColumnNumbers getArgumentsThatAreAlwaysConstant() const override { return {1}; }
    DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
    {
        if (!isString(arguments[0]))
            throw Exception(
                "Illegal type " + arguments[0]->getName() + " of argument of function " + getName(), ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
        const DataTypeArray * array_type = checkAndGetDataType<DataTypeArray>(arguments[1].get());
        if (!array_type || !checkAndGetDataType<DataTypeString>(array_type->getNestedType().get()))
            throw Exception(
                "Illegal type " + arguments[1]->getName() + " of argument of function " + getName(), ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
        return std::make_shared<DataTypeArray>(std::make_shared<DataTypeUInt64>());
    }
    void executeImpl(Block & block, const ColumnNumbers & arguments, size_t result, size_t /*input_rows_count*/) override
    {
        using ResultType = typename Impl::ResultType;
        const ColumnPtr & column_haystack = block.getByPosition(arguments[0]).column;
        const ColumnString * col_haystack_vector = checkAndGetColumn<ColumnString>(&*column_haystack);
        const ColumnPtr & arr_ptr = block.getByPosition(arguments[1]).column;
        const ColumnConst * col_const_arr = checkAndGetColumnConst<ColumnArray>(arr_ptr.get());
        if (!col_const_arr)
            throw Exception(
                "Illegal column " + block.getByPosition(arguments[1]).column->getName() + ". The array is not const",
                ErrorCodes::ILLEGAL_COLUMN);
        Array src_arr = col_const_arr->getValue<Array>();
        if (src_arr.size() > std::numeric_limits<UInt8>::max())
            throw Exception(
                "Number of arguments for function " + getName() + " doesn't match: passed " + std::to_string(src_arr.size())
                    + ", should be at most 255",
                ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH);
        std::vector<StringRef> refs;
        for (const auto & el : src_arr)
            refs.emplace_back(el.get<String>());
        const size_t column_haystack_size = column_haystack->size();
        auto col_res = ColumnVector<ResultType>::create();
        auto col_offsets = ColumnArray::ColumnOffsets::create(column_haystack_size);
        auto & vec_res = col_res->getData();
        auto & offsets_res = col_offsets->getData();
        vec_res.resize(column_haystack_size * refs.size());
        if (col_haystack_vector)
            Impl::vectorConstant(col_haystack_vector->getChars(), col_haystack_vector->getOffsets(), refs, vec_res);
        else
            throw Exception("Illegal column " + block.getByPosition(arguments[0]).column->getName(), ErrorCodes::ILLEGAL_COLUMN);
        size_t refs_size = refs.size();
        size_t accum = refs_size;
        for (size_t i = 0; i < column_haystack_size; ++i, accum += refs_size)
            offsets_res[i] = accum;
        block.getByPosition(result).column = ColumnArray::create(std::move(col_res), std::move(col_offsets));
    }
 };
 }
--- a/dbms/src/Functions/FunctionsMultiStringSearch.h
+++ b/dbms/src/Functions/FunctionsMultiStringSearch.h
@ -0,0 +1,127 @@
 #pragma once
 #include <Columns/ColumnArray.h>
 #include <Columns/ColumnConst.h>
 #include <Columns/ColumnString.h>
 #include <Columns/ColumnFixedString.h>
 #include <Columns/ColumnVector.h>
 #include <DataTypes/DataTypeArray.h>
 #include <DataTypes/DataTypeString.h>
 #include <DataTypes/DataTypesNumber.h>
 #include <Functions/FunctionHelpers.h>
 #include <Functions/IFunctionImpl.h>
 #include <IO/WriteHelpers.h>
 #include <Interpreters/Context.h>
 #include <common/StringRef.h>
 namespace DB
 {
 /**
  * multiSearchAny(haystack, [pattern_1, pattern_2, ..., pattern_n]) -- find any of the const patterns inside haystack and return 0 or 1
  * multiSearchAnyUTF8(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchAnyCaseInsensitive(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchAnyCaseInsensitiveUTF8(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchFirstIndex(haystack, [pattern_1, pattern_2, ..., pattern_n]) -- returns the first index of the matched string or zero if nothing was found
  * multiSearchFirstIndexUTF8(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchFirstIndexCaseInsensitive(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchFirstIndexCaseInsensitiveUTF8(haystack, [pattern_1, pattern_2, ..., pattern_n])
  */
 namespace ErrorCodes
 {
    extern const int ILLEGAL_TYPE_OF_ARGUMENT;
    extern const int ILLEGAL_COLUMN;
    extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH;
    extern const int FUNCTION_NOT_ALLOWED;
 }
 /// The argument limiting raises from Volnitsky searcher -- it is performance crucial to save only one byte for pattern number.
 /// But some other searchers use this function, for example, multiMatchAny -- hyperscan does not have such restrictions
 template <typename Impl, typename Name, size_t LimitArgs = std::numeric_limits<UInt8>::max()>
 class FunctionsMultiStringSearch : public IFunction
 {
    static_assert(LimitArgs > 0);
 public:
    static constexpr auto name = Name::name;
    static FunctionPtr create(const Context & context)
    {
        if (Impl::is_using_hyperscan && !context.getSettingsRef().allow_hyperscan)
            throw Exception(
                "Hyperscan functions are disabled, because setting 'allow_hyperscan' is set to 0", ErrorCodes::FUNCTION_NOT_ALLOWED);
        return std::make_shared<FunctionsMultiStringSearch>();
    }
    String getName() const override { return name; }
    size_t getNumberOfArguments() const override { return 2; }
    bool useDefaultImplementationForConstants() const override { return true; }
    ColumnNumbers getArgumentsThatAreAlwaysConstant() const override { return {1}; }
    DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
    {
        if (!isString(arguments[0]))
            throw Exception(
                "Illegal type " + arguments[0]->getName() + " of argument of function " + getName(), ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
        const DataTypeArray * array_type = checkAndGetDataType<DataTypeArray>(arguments[1].get());
        if (!array_type || !checkAndGetDataType<DataTypeString>(array_type->getNestedType().get()))
            throw Exception(
                "Illegal type " + arguments[1]->getName() + " of argument of function " + getName(), ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
        return Impl::getReturnType();
    }
    void executeImpl(Block & block, const ColumnNumbers & arguments, size_t result, size_t /*input_rows_count*/) override
    {
        using ResultType = typename Impl::ResultType;
        const ColumnPtr & column_haystack = block.getByPosition(arguments[0]).column;
        const ColumnString * col_haystack_vector = checkAndGetColumn<ColumnString>(&*column_haystack);
        const ColumnPtr & arr_ptr = block.getByPosition(arguments[1]).column;
        const ColumnConst * col_const_arr = checkAndGetColumnConst<ColumnArray>(arr_ptr.get());
        if (!col_const_arr)
            throw Exception(
                "Illegal column " + block.getByPosition(arguments[1]).column->getName() + ". The array is not const",
                ErrorCodes::ILLEGAL_COLUMN);
        Array src_arr = col_const_arr->getValue<Array>();
        if (src_arr.size() > LimitArgs)
            throw Exception(
                "Number of arguments for function " + getName() + " doesn't match: passed " + std::to_string(src_arr.size())
                    + ", should be at most " + std::to_string(LimitArgs),
                ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH);
        std::vector<StringRef> refs;
        refs.reserve(src_arr.size());
        for (const auto & el : src_arr)
            refs.emplace_back(el.get<String>());
        auto col_res = ColumnVector<ResultType>::create();
        auto col_offsets = ColumnArray::ColumnOffsets::create();
        auto & vec_res = col_res->getData();
        auto & offsets_res = col_offsets->getData();
        /// The blame for resizing output is for the callee.
        if (col_haystack_vector)
            Impl::vectorConstant(col_haystack_vector->getChars(), col_haystack_vector->getOffsets(), refs, vec_res, offsets_res);
        else
            throw Exception("Illegal column " + block.getByPosition(arguments[0]).column->getName(), ErrorCodes::ILLEGAL_COLUMN);
        if constexpr (Impl::is_column_array)
            block.getByPosition(result).column = ColumnArray::create(std::move(col_res), std::move(col_offsets));
        else
            block.getByPosition(result).column = std::move(col_res);
    }
 };
 }
--- a/dbms/src/Functions/FunctionsStringRegex.cpp
+++ b/dbms/src/Functions/FunctionsStringRegex.cpp
@ -1,5 +1,7 @@
 #include "FunctionsStringRegex.h"
 #include "FunctionsStringSearch.h"
 #include "FunctionsMultiStringSearch.h"
 #include "FunctionsStringSearchToString.h"
 #include <Columns/ColumnFixedString.h>
 #include <DataTypes/DataTypeFixedString.h>
 #include <Functions/FunctionFactory.h>
--- a/dbms/src/Functions/FunctionsStringSearch.cpp
+++ b/dbms/src/Functions/FunctionsStringSearch.cpp
@ -1,707 +0,0 @@
 #include "FunctionsStringSearch.h"
 #include <algorithm>
 #include <memory>
 #include <string>
 #include <vector>
 #include <Columns/ColumnFixedString.h>
 #include <DataTypes/DataTypeFixedString.h>
 #include <Functions/FunctionFactory.h>
 #include <Functions/Regexps.h>
 #include <IO/WriteHelpers.h>
 #include <Poco/UTF8String.h>
 #include <Common/Volnitsky.h>
 namespace DB
 {
 namespace ErrorCodes
 {
    extern const int ILLEGAL_COLUMN;
 }
 /** Implementation details for functions of 'position' family depending on ASCII/UTF8 and case sensitiveness.
  */
 struct PositionCaseSensitiveASCII
 {
    /// For searching single substring inside big-enough contiguous chunk of data. Coluld have slightly expensive initialization.
    using SearcherInBigHaystack = Volnitsky;
    /// For search many substrings in one string
    using MultiSearcherInBigHaystack = MultiVolnitsky;
    /// For searching single substring, that is different each time. This object is created for each row of data. It must have cheap initialization.
    using SearcherInSmallHaystack = LibCASCIICaseSensitiveStringSearcher;
    static SearcherInBigHaystack createSearcherInBigHaystack(const char * needle_data, size_t needle_size, size_t haystack_size_hint)
    {
        return SearcherInBigHaystack(needle_data, needle_size, haystack_size_hint);
    }
    static SearcherInSmallHaystack createSearcherInSmallHaystack(const char * needle_data, size_t needle_size)
    {
        return SearcherInSmallHaystack(needle_data, needle_size);
    }
    static MultiSearcherInBigHaystack createMultiSearcherInBigHaystack(const std::vector<StringRef> & needles)
    {
        return MultiSearcherInBigHaystack(needles);
    }
    /// Number of code points between 'begin' and 'end' (this has different behaviour for ASCII and UTF-8).
    static size_t countChars(const char * begin, const char * end) { return end - begin; }
    /// Convert string to lowercase. Only for case-insensitive search.
    /// Implementation is permitted to be inefficient because it is called for single string.
    static void toLowerIfNeed(std::string &) { }
 };
 struct PositionCaseInsensitiveASCII
 {
    /// `Volnitsky` is not used here, because one person has measured that this is better. It will be good if you question it.
    using SearcherInBigHaystack = ASCIICaseInsensitiveStringSearcher;
    using MultiSearcherInBigHaystack = MultiVolnitskyCaseInsensitive;
    using SearcherInSmallHaystack = LibCASCIICaseInsensitiveStringSearcher;
    static SearcherInBigHaystack createSearcherInBigHaystack(const char * needle_data, size_t needle_size, size_t /*haystack_size_hint*/)
    {
        return SearcherInBigHaystack(needle_data, needle_size);
    }
    static SearcherInSmallHaystack createSearcherInSmallHaystack(const char * needle_data, size_t needle_size)
    {
        return SearcherInSmallHaystack(needle_data, needle_size);
    }
    static MultiSearcherInBigHaystack createMultiSearcherInBigHaystack(const std::vector<StringRef> & needles)
    {
        return MultiSearcherInBigHaystack(needles);
    }
    static size_t countChars(const char * begin, const char * end) { return end - begin; }
    static void toLowerIfNeed(std::string & s) { std::transform(std::begin(s), std::end(s), std::begin(s), tolower); }
 };
 struct PositionCaseSensitiveUTF8
 {
    using SearcherInBigHaystack = VolnitskyUTF8;
    using MultiSearcherInBigHaystack = MultiVolnitskyUTF8;
    using SearcherInSmallHaystack = LibCASCIICaseSensitiveStringSearcher;
    static SearcherInBigHaystack createSearcherInBigHaystack(const char * needle_data, size_t needle_size, size_t haystack_size_hint)
    {
        return SearcherInBigHaystack(needle_data, needle_size, haystack_size_hint);
    }
    static SearcherInSmallHaystack createSearcherInSmallHaystack(const char * needle_data, size_t needle_size)
    {
        return SearcherInSmallHaystack(needle_data, needle_size);
    }
    static MultiSearcherInBigHaystack createMultiSearcherInBigHaystack(const std::vector<StringRef> & needles)
    {
        return MultiSearcherInBigHaystack(needles);
    }
    static size_t countChars(const char * begin, const char * end)
    {
        size_t res = 0;
        for (auto it = begin; it != end; ++it)
            if (!UTF8::isContinuationOctet(static_cast<UInt8>(*it)))
                ++res;
        return res;
    }
    static void toLowerIfNeed(std::string &) { }
 };
 struct PositionCaseInsensitiveUTF8
 {
    using SearcherInBigHaystack = VolnitskyCaseInsensitiveUTF8;
    using MultiSearcherInBigHaystack = MultiVolnitskyCaseInsensitiveUTF8;
    using SearcherInSmallHaystack = UTF8CaseInsensitiveStringSearcher; /// TODO Very suboptimal.
    static SearcherInBigHaystack createSearcherInBigHaystack(const char * needle_data, size_t needle_size, size_t haystack_size_hint)
    {
        return SearcherInBigHaystack(needle_data, needle_size, haystack_size_hint);
    }
    static SearcherInSmallHaystack createSearcherInSmallHaystack(const char * needle_data, size_t needle_size)
    {
        return SearcherInSmallHaystack(needle_data, needle_size);
    }
    static MultiSearcherInBigHaystack createMultiSearcherInBigHaystack(const std::vector<StringRef> & needles)
    {
        return MultiSearcherInBigHaystack(needles);
    }
    static size_t countChars(const char * begin, const char * end)
    {
        size_t res = 0;
        for (auto it = begin; it != end; ++it)
            if (!UTF8::isContinuationOctet(static_cast<UInt8>(*it)))
                ++res;
        return res;
    }
    static void toLowerIfNeed(std::string & s) { Poco::UTF8::toLowerInPlace(s); }
 };
 template <typename Impl>
 struct PositionImpl
 {
    static constexpr bool use_default_implementation_for_constants = false;
    using ResultType = UInt64;
    /// Find one substring in many strings.
    static void vectorConstant(
        const ColumnString::Chars & data, const ColumnString::Offsets & offsets, const std::string & needle, PaddedPODArray<UInt64> & res)
    {
        const UInt8 * begin = data.data();
        const UInt8 * pos = begin;
        const UInt8 * end = pos + data.size();
        /// Current index in the array of strings.
        size_t i = 0;
        typename Impl::SearcherInBigHaystack searcher = Impl::createSearcherInBigHaystack(needle.data(), needle.size(), end - pos);
        /// We will search for the next occurrence in all strings at once.
        while (pos < end && end != (pos = searcher.search(pos, end - pos)))
        {
            /// Determine which index it refers to.
            while (begin + offsets[i] <= pos)
            {
                res[i] = 0;
                ++i;
            }
            /// We check that the entry does not pass through the boundaries of strings.
            if (pos + needle.size() < begin + offsets[i])
                res[i] = 1 + Impl::countChars(reinterpret_cast<const char *>(begin + offsets[i - 1]), reinterpret_cast<const char *>(pos));
            else
                res[i] = 0;
            pos = begin + offsets[i];
            ++i;
        }
        if (i < res.size())
            memset(&res[i], 0, (res.size() - i) * sizeof(res[0]));
    }
    /// Search for substring in string.
    static void constantConstant(std::string data, std::string needle, UInt64 & res)
    {
        Impl::toLowerIfNeed(data);
        Impl::toLowerIfNeed(needle);
        res = data.find(needle);
        if (res == std::string::npos)
            res = 0;
        else
            res = 1 + Impl::countChars(data.data(), data.data() + res);
    }
    /// Search each time for a different single substring inside each time different string.
    static void vectorVector(
        const ColumnString::Chars & haystack_data,
        const ColumnString::Offsets & haystack_offsets,
        const ColumnString::Chars & needle_data,
        const ColumnString::Offsets & needle_offsets,
        PaddedPODArray<UInt64> & res)
    {
        ColumnString::Offset prev_haystack_offset = 0;
        ColumnString::Offset prev_needle_offset = 0;
        size_t size = haystack_offsets.size();
        for (size_t i = 0; i < size; ++i)
        {
            size_t needle_size = needle_offsets[i] - prev_needle_offset - 1;
            size_t haystack_size = haystack_offsets[i] - prev_haystack_offset - 1;
            if (0 == needle_size)
            {
                /// An empty string is always at the very beginning of `haystack`.
                res[i] = 1;
            }
            else
            {
                /// It is assumed that the StringSearcher is not very difficult to initialize.
                typename Impl::SearcherInSmallHaystack searcher = Impl::createSearcherInSmallHaystack(
                    reinterpret_cast<const char *>(&needle_data[prev_needle_offset]),
                    needle_offsets[i] - prev_needle_offset - 1); /// zero byte at the end
                /// searcher returns a pointer to the found substring or to the end of `haystack`.
                size_t pos = searcher.search(&haystack_data[prev_haystack_offset], &haystack_data[haystack_offsets[i] - 1])
                    - &haystack_data[prev_haystack_offset];
                if (pos != haystack_size)
                {
                    res[i] = 1
                        + Impl::countChars(
                                 reinterpret_cast<const char *>(&haystack_data[prev_haystack_offset]),
                                 reinterpret_cast<const char *>(&haystack_data[prev_haystack_offset + pos]));
                }
                else
                    res[i] = 0;
            }
            prev_haystack_offset = haystack_offsets[i];
            prev_needle_offset = needle_offsets[i];
        }
    }
    /// Find many substrings in single string.
    static void constantVector(
        const String & haystack,
        const ColumnString::Chars & needle_data,
        const ColumnString::Offsets & needle_offsets,
        PaddedPODArray<UInt64> & res)
    {
        // NOTE You could use haystack indexing. But this is a rare case.
        ColumnString::Offset prev_needle_offset = 0;
        size_t size = needle_offsets.size();
        for (size_t i = 0; i < size; ++i)
        {
            size_t needle_size = needle_offsets[i] - prev_needle_offset - 1;
            if (0 == needle_size)
            {
                res[i] = 1;
            }
            else
            {
                typename Impl::SearcherInSmallHaystack searcher = Impl::createSearcherInSmallHaystack(
                    reinterpret_cast<const char *>(&needle_data[prev_needle_offset]), needle_offsets[i] - prev_needle_offset - 1);
                size_t pos = searcher.search(
                                 reinterpret_cast<const UInt8 *>(haystack.data()),
                                 reinterpret_cast<const UInt8 *>(haystack.data()) + haystack.size())
                    - reinterpret_cast<const UInt8 *>(haystack.data());
                if (pos != haystack.size())
                {
                    res[i] = 1 + Impl::countChars(haystack.data(), haystack.data() + pos);
                }
                else
                    res[i] = 0;
            }
            prev_needle_offset = needle_offsets[i];
        }
    }
    template <typename... Args>
    static void vectorFixedConstant(Args &&...)
    {
        throw Exception("Functions 'position' don't support FixedString haystack argument", ErrorCodes::ILLEGAL_COLUMN);
    }
 };
 template <typename Impl>
 struct MultiSearchAllPositionsImpl
 {
    using ResultType = UInt64;
    static void vectorConstant(
        const ColumnString::Chars & haystack_data,
        const ColumnString::Offsets & haystack_offsets,
        const std::vector<StringRef> & needles,
        PaddedPODArray<UInt64> & res)
    {
        auto res_callback = [](const UInt8 * start, const UInt8 * end) -> UInt64
        {
            return 1 + Impl::countChars(reinterpret_cast<const char *>(start), reinterpret_cast<const char *>(end));
        };
        auto searcher = Impl::createMultiSearcherInBigHaystack(needles);
        const size_t haystack_string_size = haystack_offsets.size();
        const size_t needles_size = needles.size();
        /// Something can be uninitialized after the search itself
        std::fill(res.begin(), res.end(), 0);
        while (searcher.hasMoreToSearch())
        {
            size_t prev_offset = 0;
            for (size_t j = 0, from = 0; j < haystack_string_size; ++j, from += needles_size)
            {
                const auto * haystack = &haystack_data[prev_offset];
                const auto * haystack_end = haystack + haystack_offsets[j] - prev_offset - 1;
                searcher.searchOneAll(haystack, haystack_end, res.data() + from, res_callback);
                prev_offset = haystack_offsets[j];
            }
        }
    }
 };
 template <typename Impl>
 struct MultiSearchImpl
 {
    using ResultType = UInt8;
    static constexpr bool is_using_hyperscan = false;
    /// Variable for understanding, if we used offsets for the output, most
    /// likely to determine whether the function returns ColumnVector of ColumnArray.
    static constexpr bool is_column_array = false;
    static auto getReturnType() { return std::make_shared<DataTypeNumber<ResultType>>(); }
    static void vectorConstant(
        const ColumnString::Chars & haystack_data,
        const ColumnString::Offsets & haystack_offsets,
        const std::vector<StringRef> & needles,
        PaddedPODArray<UInt8> & res,
        [[maybe_unused]] PaddedPODArray<UInt64> & offsets)
    {
        auto searcher = Impl::createMultiSearcherInBigHaystack(needles);
        const size_t haystack_string_size = haystack_offsets.size();
        res.resize(haystack_string_size);
        size_t iteration = 0;
        while (searcher.hasMoreToSearch())
        {
            size_t prev_offset = 0;
            for (size_t j = 0; j < haystack_string_size; ++j)
            {
                const auto * haystack = &haystack_data[prev_offset];
                const auto * haystack_end = haystack + haystack_offsets[j] - prev_offset - 1;
                if (iteration == 0 || !res[j])
                    res[j] = searcher.searchOne(haystack, haystack_end);
                prev_offset = haystack_offsets[j];
            }
            ++iteration;
        }
    }
 };
 template <typename Impl>
 struct MultiSearchFirstPositionImpl
 {
    using ResultType = UInt64;
    static constexpr bool is_using_hyperscan = false;
    /// Variable for understanding, if we used offsets for the output, most
    /// likely to determine whether the function returns ColumnVector of ColumnArray.
    static constexpr bool is_column_array = false;
    static auto getReturnType() { return std::make_shared<DataTypeNumber<ResultType>>(); }
    static void vectorConstant(
        const ColumnString::Chars & haystack_data,
        const ColumnString::Offsets & haystack_offsets,
        const std::vector<StringRef> & needles,
        PaddedPODArray<UInt64> & res,
        [[maybe_unused]] PaddedPODArray<UInt64> & offsets)
    {
        auto res_callback = [](const UInt8 * start, const UInt8 * end) -> UInt64
        {
            return 1 + Impl::countChars(reinterpret_cast<const char *>(start), reinterpret_cast<const char *>(end));
        };
        auto searcher = Impl::createMultiSearcherInBigHaystack(needles);
        const size_t haystack_string_size = haystack_offsets.size();
        res.resize(haystack_string_size);
        size_t iteration = 0;
        while (searcher.hasMoreToSearch())
        {
            size_t prev_offset = 0;
            for (size_t j = 0; j < haystack_string_size; ++j)
            {
                const auto * haystack = &haystack_data[prev_offset];
                const auto * haystack_end = haystack + haystack_offsets[j] - prev_offset - 1;
                if (iteration == 0 || res[j] == 0)
                    res[j] = searcher.searchOneFirstPosition(haystack, haystack_end, res_callback);
                else
                {
                    UInt64 result = searcher.searchOneFirstPosition(haystack, haystack_end, res_callback);
                    if (result != 0)
                        res[j] = std::min(result, res[j]);
                }
                prev_offset = haystack_offsets[j];
            }
            ++iteration;
        }
    }
 };
 template <typename Impl>
 struct MultiSearchFirstIndexImpl
 {
    using ResultType = UInt64;
    static constexpr bool is_using_hyperscan = false;
    /// Variable for understanding, if we used offsets for the output, most
    /// likely to determine whether the function returns ColumnVector of ColumnArray.
    static constexpr bool is_column_array = false;
    static auto getReturnType() { return std::make_shared<DataTypeNumber<ResultType>>(); }
    static void vectorConstant(
        const ColumnString::Chars & haystack_data,
        const ColumnString::Offsets & haystack_offsets,
        const std::vector<StringRef> & needles,
        PaddedPODArray<UInt64> & res,
        [[maybe_unused]] PaddedPODArray<UInt64> & offsets)
    {
        auto searcher = Impl::createMultiSearcherInBigHaystack(needles);
        const size_t haystack_string_size = haystack_offsets.size();
        res.resize(haystack_string_size);
        size_t iteration = 0;
        while (searcher.hasMoreToSearch())
        {
            size_t prev_offset = 0;
            for (size_t j = 0; j < haystack_string_size; ++j)
            {
                const auto * haystack = &haystack_data[prev_offset];
                const auto * haystack_end = haystack + haystack_offsets[j] - prev_offset - 1;
                /// hasMoreToSearch traverse needles in increasing order
                if (iteration == 0 || res[j] == 0)
                    res[j] = searcher.searchOneFirstIndex(haystack, haystack_end);
                prev_offset = haystack_offsets[j];
            }
            ++iteration;
        }
    }
 };
 /** Token search the string, means that needle must be surrounded by some separator chars, like whitespace or puctuation.
  */
 template <typename TokenSearcher, bool negate_result = false>
 struct HasTokenImpl
 {
    using ResultType = UInt8;
    static constexpr bool use_default_implementation_for_constants = true;
    static void vectorConstant(
        const ColumnString::Chars & data, const ColumnString::Offsets & offsets, const std::string & pattern, PaddedPODArray<UInt8> & res)
    {
        if (offsets.empty())
            return;
        const UInt8 * begin = data.data();
        const UInt8 * pos = begin;
        const UInt8 * end = pos + data.size();
        /// The current index in the array of strings.
        size_t i = 0;
        TokenSearcher searcher(pattern.data(), pattern.size(), end - pos);
        /// We will search for the next occurrence in all rows at once.
        while (pos < end && end != (pos = searcher.search(pos, end - pos)))
        {
            /// Let's determine which index it refers to.
            while (begin + offsets[i] <= pos)
            {
                res[i] = negate_result;
                ++i;
            }
            /// We check that the entry does not pass through the boundaries of strings.
            if (pos + pattern.size() < begin + offsets[i])
                res[i] = !negate_result;
            else
                res[i] = negate_result;
            pos = begin + offsets[i];
            ++i;
        }
        /// Tail, in which there can be no substring.
        if (i < res.size())
            memset(&res[i], negate_result, (res.size() - i) * sizeof(res[0]));
    }
    template <typename... Args>
    static void vectorVector(Args &&...)
    {
        throw Exception("Function 'hasToken' does not support non-constant needle argument", ErrorCodes::ILLEGAL_COLUMN);
    }
    /// Search different needles in single haystack.
    template <typename... Args>
    static void constantVector(Args &&...)
    {
        throw Exception("Function 'hasToken' does not support non-constant needle argument", ErrorCodes::ILLEGAL_COLUMN);
    }
    template <typename... Args>
    static void vectorFixedConstant(Args &&...)
    {
        throw Exception("Functions 'hasToken' don't support FixedString haystack argument", ErrorCodes::ILLEGAL_COLUMN);
    }
 };
 struct NamePosition
 {
    static constexpr auto name = "position";
 };
 struct NamePositionUTF8
 {
    static constexpr auto name = "positionUTF8";
 };
 struct NamePositionCaseInsensitive
 {
    static constexpr auto name = "positionCaseInsensitive";
 };
 struct NamePositionCaseInsensitiveUTF8
 {
    static constexpr auto name = "positionCaseInsensitiveUTF8";
 };
 struct NameMultiSearchAllPositions
 {
    static constexpr auto name = "multiSearchAllPositions";
 };
 struct NameMultiSearchAllPositionsUTF8
 {
    static constexpr auto name = "multiSearchAllPositionsUTF8";
 };
 struct NameMultiSearchAllPositionsCaseInsensitive
 {
    static constexpr auto name = "multiSearchAllPositionsCaseInsensitive";
 };
 struct NameMultiSearchAllPositionsCaseInsensitiveUTF8
 {
    static constexpr auto name = "multiSearchAllPositionsCaseInsensitiveUTF8";
 };
 struct NameMultiSearchAny
 {
    static constexpr auto name = "multiSearchAny";
 };
 struct NameMultiSearchAnyUTF8
 {
    static constexpr auto name = "multiSearchAnyUTF8";
 };
 struct NameMultiSearchAnyCaseInsensitive
 {
    static constexpr auto name = "multiSearchAnyCaseInsensitive";
 };
 struct NameMultiSearchAnyCaseInsensitiveUTF8
 {
    static constexpr auto name = "multiSearchAnyCaseInsensitiveUTF8";
 };
 struct NameMultiSearchFirstIndex
 {
    static constexpr auto name = "multiSearchFirstIndex";
 };
 struct NameMultiSearchFirstIndexUTF8
 {
    static constexpr auto name = "multiSearchFirstIndexUTF8";
 };
 struct NameMultiSearchFirstIndexCaseInsensitive
 {
    static constexpr auto name = "multiSearchFirstIndexCaseInsensitive";
 };
 struct NameMultiSearchFirstIndexCaseInsensitiveUTF8
 {
    static constexpr auto name = "multiSearchFirstIndexCaseInsensitiveUTF8";
 };
 struct NameMultiSearchFirstPosition
 {
    static constexpr auto name = "multiSearchFirstPosition";
 };
 struct NameMultiSearchFirstPositionUTF8
 {
    static constexpr auto name = "multiSearchFirstPositionUTF8";
 };
 struct NameMultiSearchFirstPositionCaseInsensitive
 {
    static constexpr auto name = "multiSearchFirstPositionCaseInsensitive";
 };
 struct NameMultiSearchFirstPositionCaseInsensitiveUTF8
 {
    static constexpr auto name = "multiSearchFirstPositionCaseInsensitiveUTF8";
 };
 struct NameHasToken
 {
    static constexpr auto name = "hasToken";
 };
 struct NameHasTokenCaseInsensitive
 {
    static constexpr auto name = "hasTokenCaseInsensitive";
 };
 using FunctionPosition = FunctionsStringSearch<PositionImpl<PositionCaseSensitiveASCII>, NamePosition>;
 using FunctionPositionUTF8 = FunctionsStringSearch<PositionImpl<PositionCaseSensitiveUTF8>, NamePositionUTF8>;
 using FunctionPositionCaseInsensitive = FunctionsStringSearch<PositionImpl<PositionCaseInsensitiveASCII>, NamePositionCaseInsensitive>;
 using FunctionPositionCaseInsensitiveUTF8
    = FunctionsStringSearch<PositionImpl<PositionCaseInsensitiveUTF8>, NamePositionCaseInsensitiveUTF8>;
 using FunctionMultiSearchAllPositions
    = FunctionsMultiStringPosition<MultiSearchAllPositionsImpl<PositionCaseSensitiveASCII>, NameMultiSearchAllPositions>;
 using FunctionMultiSearchAllPositionsUTF8
    = FunctionsMultiStringPosition<MultiSearchAllPositionsImpl<PositionCaseSensitiveUTF8>, NameMultiSearchAllPositionsUTF8>;
 using FunctionMultiSearchAllPositionsCaseInsensitive
    = FunctionsMultiStringPosition<MultiSearchAllPositionsImpl<PositionCaseInsensitiveASCII>, NameMultiSearchAllPositionsCaseInsensitive>;
 using FunctionMultiSearchAllPositionsCaseInsensitiveUTF8 = FunctionsMultiStringPosition<
    MultiSearchAllPositionsImpl<PositionCaseInsensitiveUTF8>,
    NameMultiSearchAllPositionsCaseInsensitiveUTF8>;
 using FunctionMultiSearch = FunctionsMultiStringSearch<MultiSearchImpl<PositionCaseSensitiveASCII>, NameMultiSearchAny>;
 using FunctionMultiSearchUTF8 = FunctionsMultiStringSearch<MultiSearchImpl<PositionCaseSensitiveUTF8>, NameMultiSearchAnyUTF8>;
 using FunctionMultiSearchCaseInsensitive
    = FunctionsMultiStringSearch<MultiSearchImpl<PositionCaseInsensitiveASCII>, NameMultiSearchAnyCaseInsensitive>;
 using FunctionMultiSearchCaseInsensitiveUTF8
    = FunctionsMultiStringSearch<MultiSearchImpl<PositionCaseInsensitiveUTF8>, NameMultiSearchAnyCaseInsensitiveUTF8>;
 using FunctionMultiSearchFirstIndex
    = FunctionsMultiStringSearch<MultiSearchFirstIndexImpl<PositionCaseSensitiveASCII>, NameMultiSearchFirstIndex>;
 using FunctionMultiSearchFirstIndexUTF8
    = FunctionsMultiStringSearch<MultiSearchFirstIndexImpl<PositionCaseSensitiveUTF8>, NameMultiSearchFirstIndexUTF8>;
 using FunctionMultiSearchFirstIndexCaseInsensitive
    = FunctionsMultiStringSearch<MultiSearchFirstIndexImpl<PositionCaseInsensitiveASCII>, NameMultiSearchFirstIndexCaseInsensitive>;
 using FunctionMultiSearchFirstIndexCaseInsensitiveUTF8
    = FunctionsMultiStringSearch<MultiSearchFirstIndexImpl<PositionCaseInsensitiveUTF8>, NameMultiSearchFirstIndexCaseInsensitiveUTF8>;
 using FunctionMultiSearchFirstPosition
    = FunctionsMultiStringSearch<MultiSearchFirstPositionImpl<PositionCaseSensitiveASCII>, NameMultiSearchFirstPosition>;
 using FunctionMultiSearchFirstPositionUTF8
    = FunctionsMultiStringSearch<MultiSearchFirstPositionImpl<PositionCaseSensitiveUTF8>, NameMultiSearchFirstPositionUTF8>;
 using FunctionMultiSearchFirstPositionCaseInsensitive
    = FunctionsMultiStringSearch<MultiSearchFirstPositionImpl<PositionCaseInsensitiveASCII>, NameMultiSearchFirstPositionCaseInsensitive>;
 using FunctionMultiSearchFirstPositionCaseInsensitiveUTF8 = FunctionsMultiStringSearch<
    MultiSearchFirstPositionImpl<PositionCaseInsensitiveUTF8>,
    NameMultiSearchFirstPositionCaseInsensitiveUTF8>;
 using FunctionHasToken = FunctionsStringSearch<HasTokenImpl<VolnitskyCaseSensitiveToken, false>, NameHasToken>;
 using FunctionHasTokenCaseInsensitive
    = FunctionsStringSearch<HasTokenImpl<VolnitskyCaseInsensitiveToken, false>, NameHasTokenCaseInsensitive>;
 void registerFunctionsStringSearch(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionPosition>(FunctionFactory::CaseInsensitive);
    factory.registerFunction<FunctionPositionUTF8>();
    factory.registerFunction<FunctionPositionCaseInsensitive>();
    factory.registerFunction<FunctionPositionCaseInsensitiveUTF8>();
    factory.registerFunction<FunctionMultiSearchAllPositions>();
    factory.registerFunction<FunctionMultiSearchAllPositionsUTF8>();
    factory.registerFunction<FunctionMultiSearchAllPositionsCaseInsensitive>();
    factory.registerFunction<FunctionMultiSearchAllPositionsCaseInsensitiveUTF8>();
    factory.registerFunction<FunctionMultiSearch>();
    factory.registerFunction<FunctionMultiSearchUTF8>();
    factory.registerFunction<FunctionMultiSearchCaseInsensitive>();
    factory.registerFunction<FunctionMultiSearchCaseInsensitiveUTF8>();
    factory.registerFunction<FunctionMultiSearchFirstIndex>();
    factory.registerFunction<FunctionMultiSearchFirstIndexUTF8>();
    factory.registerFunction<FunctionMultiSearchFirstIndexCaseInsensitive>();
    factory.registerFunction<FunctionMultiSearchFirstIndexCaseInsensitiveUTF8>();
    factory.registerFunction<FunctionMultiSearchFirstPosition>();
    factory.registerFunction<FunctionMultiSearchFirstPositionUTF8>();
    factory.registerFunction<FunctionMultiSearchFirstPositionCaseInsensitive>();
    factory.registerFunction<FunctionMultiSearchFirstPositionCaseInsensitiveUTF8>();
    factory.registerFunction<FunctionHasToken>();
    factory.registerFunction<FunctionHasTokenCaseInsensitive>();
    factory.registerAlias("locate", NamePosition::name, FunctionFactory::CaseInsensitive);
 }
 }
--- a/dbms/src/Functions/FunctionsStringSearch.h
+++ b/dbms/src/Functions/FunctionsStringSearch.h
@ -1,6 +1,5 @@
 #pragma once
 #include <Columns/ColumnArray.h>
 #include <Columns/ColumnConst.h>
 #include <Columns/ColumnString.h>
 #include <Columns/ColumnFixedString.h>
@ -10,9 +9,7 @@
 #include <DataTypes/DataTypesNumber.h>
 #include <Functions/FunctionHelpers.h>
 #include <Functions/IFunctionImpl.h>
 #include <IO/WriteHelpers.h>
 #include <Interpreters/Context.h>
 #include <common/StringRef.h>
 namespace DB
@ -37,40 +34,12 @@ namespace DB
  * - the zero subpattern (the match part, otherwise);
  * - if not match - an empty string.
  * extract(haystack, pattern)
  *
  * replaceOne(haystack, pattern, replacement) - replacing the pattern with the specified rules, only the first occurrence.
  * replaceAll(haystack, pattern, replacement) - replacing the pattern with the specified rules, all occurrences.
  *
  * replaceRegexpOne(haystack, pattern, replacement) - replaces the pattern with the specified regexp, only the first occurrence.
  * replaceRegexpAll(haystack, pattern, replacement) - replaces the pattern with the specified type, all occurrences.
  *
  * multiSearchAllPositions(haystack, [pattern_1, pattern_2, ..., pattern_n]) -- find first occurrences (positions) of all the const patterns inside haystack
  * multiSearchAllPositionsUTF8(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchAllPositionsCaseInsensitive(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchAllPositionsCaseInsensitiveUTF8(haystack, [pattern_1, pattern_2, ..., pattern_n])
  *
  * multiSearchFirstPosition(haystack, [pattern_1, pattern_2, ..., pattern_n]) -- returns the first position of the haystack matched by strings or zero if nothing was found
  * multiSearchFirstPositionUTF8(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchFirstPositionCaseInsensitive(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchFirstPositionCaseInsensitiveUTF8(haystack, [pattern_1, pattern_2, ..., pattern_n])
  *
  * multiSearchAny(haystack, [pattern_1, pattern_2, ..., pattern_n]) -- find any of the const patterns inside haystack and return 0 or 1
  * multiSearchAnyUTF8(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchAnyCaseInsensitive(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchAnyCaseInsensitiveUTF8(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchFirstIndex(haystack, [pattern_1, pattern_2, ..., pattern_n]) -- returns the first index of the matched string or zero if nothing was found
  * multiSearchFirstIndexUTF8(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchFirstIndexCaseInsensitive(haystack, [pattern_1, pattern_2, ..., pattern_n])
  * multiSearchFirstIndexCaseInsensitiveUTF8(haystack, [pattern_1, pattern_2, ..., pattern_n])
  */
 namespace ErrorCodes
 {
    extern const int ILLEGAL_TYPE_OF_ARGUMENT;
    extern const int ILLEGAL_COLUMN;
    extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH;
    extern const int FUNCTION_NOT_ALLOWED;
 }
 template <typename Impl, typename Name>
@ -163,224 +132,4 @@ public:
    }
 };
 template <typename Impl, typename Name>
 class FunctionsStringSearchToString : public IFunction
 {
 public:
    static constexpr auto name = Name::name;
    static FunctionPtr create(const Context &) { return std::make_shared<FunctionsStringSearchToString>(); }
    String getName() const override { return name; }
    size_t getNumberOfArguments() const override { return 2; }
    bool useDefaultImplementationForConstants() const override { return true; }
    ColumnNumbers getArgumentsThatAreAlwaysConstant() const override { return {1}; }
    DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
    {
        if (!isString(arguments[0]))
            throw Exception(
                "Illegal type " + arguments[0]->getName() + " of argument of function " + getName(), ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
        if (!isString(arguments[1]))
            throw Exception(
                "Illegal type " + arguments[1]->getName() + " of argument of function " + getName(), ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
        return std::make_shared<DataTypeString>();
    }
    void executeImpl(Block & block, const ColumnNumbers & arguments, size_t result, size_t /*input_rows_count*/) override
    {
        const ColumnPtr column = block.getByPosition(arguments[0]).column;
        const ColumnPtr column_needle = block.getByPosition(arguments[1]).column;
        const ColumnConst * col_needle = typeid_cast<const ColumnConst *>(&*column_needle);
        if (!col_needle)
            throw Exception("Second argument of function " + getName() + " must be constant string", ErrorCodes::ILLEGAL_COLUMN);
        if (const ColumnString * col = checkAndGetColumn<ColumnString>(column.get()))
        {
            auto col_res = ColumnString::create();
            ColumnString::Chars & vec_res = col_res->getChars();
            ColumnString::Offsets & offsets_res = col_res->getOffsets();
            Impl::vector(col->getChars(), col->getOffsets(), col_needle->getValue<String>(), vec_res, offsets_res);
            block.getByPosition(result).column = std::move(col_res);
        }
        else
            throw Exception(
                "Illegal column " + block.getByPosition(arguments[0]).column->getName() + " of argument of function " + getName(),
                ErrorCodes::ILLEGAL_COLUMN);
    }
 };
 template <typename Impl, typename Name>
 class FunctionsMultiStringPosition : public IFunction
 {
 public:
    static constexpr auto name = Name::name;
    static FunctionPtr create(const Context &) { return std::make_shared<FunctionsMultiStringPosition>(); }
    String getName() const override { return name; }
    size_t getNumberOfArguments() const override { return 2; }
    bool useDefaultImplementationForConstants() const override { return true; }
    ColumnNumbers getArgumentsThatAreAlwaysConstant() const override { return {1}; }
    DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
    {
        if (!isString(arguments[0]))
            throw Exception(
                "Illegal type " + arguments[0]->getName() + " of argument of function " + getName(), ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
        const DataTypeArray * array_type = checkAndGetDataType<DataTypeArray>(arguments[1].get());
        if (!array_type || !checkAndGetDataType<DataTypeString>(array_type->getNestedType().get()))
            throw Exception(
                "Illegal type " + arguments[1]->getName() + " of argument of function " + getName(), ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
        return std::make_shared<DataTypeArray>(std::make_shared<DataTypeUInt64>());
    }
    void executeImpl(Block & block, const ColumnNumbers & arguments, size_t result, size_t /*input_rows_count*/) override
    {
        using ResultType = typename Impl::ResultType;
        const ColumnPtr & column_haystack = block.getByPosition(arguments[0]).column;
        const ColumnString * col_haystack_vector = checkAndGetColumn<ColumnString>(&*column_haystack);
        const ColumnPtr & arr_ptr = block.getByPosition(arguments[1]).column;
        const ColumnConst * col_const_arr = checkAndGetColumnConst<ColumnArray>(arr_ptr.get());
        if (!col_const_arr)
            throw Exception(
                "Illegal column " + block.getByPosition(arguments[1]).column->getName() + ". The array is not const",
                ErrorCodes::ILLEGAL_COLUMN);
        Array src_arr = col_const_arr->getValue<Array>();
        if (src_arr.size() > std::numeric_limits<UInt8>::max())
            throw Exception(
                "Number of arguments for function " + getName() + " doesn't match: passed " + std::to_string(src_arr.size())
                    + ", should be at most 255",
                ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH);
        std::vector<StringRef> refs;
        for (const auto & el : src_arr)
            refs.emplace_back(el.get<String>());
        const size_t column_haystack_size = column_haystack->size();
        auto col_res = ColumnVector<ResultType>::create();
        auto col_offsets = ColumnArray::ColumnOffsets::create(column_haystack_size);
        auto & vec_res = col_res->getData();
        auto & offsets_res = col_offsets->getData();
        vec_res.resize(column_haystack_size * refs.size());
        if (col_haystack_vector)
            Impl::vectorConstant(col_haystack_vector->getChars(), col_haystack_vector->getOffsets(), refs, vec_res);
        else
            throw Exception("Illegal column " + block.getByPosition(arguments[0]).column->getName(), ErrorCodes::ILLEGAL_COLUMN);
        size_t refs_size = refs.size();
        size_t accum = refs_size;
        for (size_t i = 0; i < column_haystack_size; ++i, accum += refs_size)
            offsets_res[i] = accum;
        block.getByPosition(result).column = ColumnArray::create(std::move(col_res), std::move(col_offsets));
    }
 };
 /// The argument limiting raises from Volnitsky searcher -- it is performance crucial to save only one byte for pattern number.
 /// But some other searchers use this function, for example, multiMatchAny -- hyperscan does not have such restrictions
 template <typename Impl, typename Name, size_t LimitArgs = std::numeric_limits<UInt8>::max()>
 class FunctionsMultiStringSearch : public IFunction
 {
    static_assert(LimitArgs > 0);
 public:
    static constexpr auto name = Name::name;
    static FunctionPtr create(const Context & context)
    {
        if (Impl::is_using_hyperscan && !context.getSettingsRef().allow_hyperscan)
            throw Exception(
                "Hyperscan functions are disabled, because setting 'allow_hyperscan' is set to 0", ErrorCodes::FUNCTION_NOT_ALLOWED);
        return std::make_shared<FunctionsMultiStringSearch>();
    }
    String getName() const override { return name; }
    size_t getNumberOfArguments() const override { return 2; }
    bool useDefaultImplementationForConstants() const override { return true; }
    ColumnNumbers getArgumentsThatAreAlwaysConstant() const override { return {1}; }
    DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
    {
        if (!isString(arguments[0]))
            throw Exception(
                "Illegal type " + arguments[0]->getName() + " of argument of function " + getName(), ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
        const DataTypeArray * array_type = checkAndGetDataType<DataTypeArray>(arguments[1].get());
        if (!array_type || !checkAndGetDataType<DataTypeString>(array_type->getNestedType().get()))
            throw Exception(
                "Illegal type " + arguments[1]->getName() + " of argument of function " + getName(), ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
        return Impl::getReturnType();
    }
    void executeImpl(Block & block, const ColumnNumbers & arguments, size_t result, size_t /*input_rows_count*/) override
    {
        using ResultType = typename Impl::ResultType;
        const ColumnPtr & column_haystack = block.getByPosition(arguments[0]).column;
        const ColumnString * col_haystack_vector = checkAndGetColumn<ColumnString>(&*column_haystack);
        const ColumnPtr & arr_ptr = block.getByPosition(arguments[1]).column;
        const ColumnConst * col_const_arr = checkAndGetColumnConst<ColumnArray>(arr_ptr.get());
        if (!col_const_arr)
            throw Exception(
                "Illegal column " + block.getByPosition(arguments[1]).column->getName() + ". The array is not const",
                ErrorCodes::ILLEGAL_COLUMN);
        Array src_arr = col_const_arr->getValue<Array>();
        if (src_arr.size() > LimitArgs)
            throw Exception(
                "Number of arguments for function " + getName() + " doesn't match: passed " + std::to_string(src_arr.size())
                    + ", should be at most " + std::to_string(LimitArgs),
                ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH);
        std::vector<StringRef> refs;
        refs.reserve(src_arr.size());
        for (const auto & el : src_arr)
            refs.emplace_back(el.get<String>());
        auto col_res = ColumnVector<ResultType>::create();
        auto col_offsets = ColumnArray::ColumnOffsets::create();
        auto & vec_res = col_res->getData();
        auto & offsets_res = col_offsets->getData();
        /// The blame for resizing output is for the callee.
        if (col_haystack_vector)
            Impl::vectorConstant(col_haystack_vector->getChars(), col_haystack_vector->getOffsets(), refs, vec_res, offsets_res);
        else
            throw Exception("Illegal column " + block.getByPosition(arguments[0]).column->getName(), ErrorCodes::ILLEGAL_COLUMN);
        if constexpr (Impl::is_column_array)
            block.getByPosition(result).column = ColumnArray::create(std::move(col_res), std::move(col_offsets));
        else
            block.getByPosition(result).column = std::move(col_res);
    }
 };
 }
--- a/dbms/src/Functions/FunctionsStringSearchToString.h
+++ b/dbms/src/Functions/FunctionsStringSearchToString.h
@ -0,0 +1,87 @@
 #pragma once
 #include <Columns/ColumnArray.h>
 #include <Columns/ColumnConst.h>
 #include <Columns/ColumnString.h>
 #include <Columns/ColumnFixedString.h>
 #include <Columns/ColumnVector.h>
 #include <DataTypes/DataTypeArray.h>
 #include <DataTypes/DataTypeString.h>
 #include <DataTypes/DataTypesNumber.h>
 #include <Functions/FunctionHelpers.h>
 #include <Functions/IFunctionImpl.h>
 #include <IO/WriteHelpers.h>
 #include <Interpreters/Context.h>
 #include <common/StringRef.h>
 namespace DB
 {
 /** Applies regexp re2 and extracts:
  * - the first subpattern, if the regexp has a subpattern;
  * - the zero subpattern (the match part, otherwise);
  * - if not match - an empty string.
  * extract(haystack, pattern)
  */
 namespace ErrorCodes
 {
    extern const int ILLEGAL_TYPE_OF_ARGUMENT;
    extern const int ILLEGAL_COLUMN;
 }
 template <typename Impl, typename Name>
 class FunctionsStringSearchToString : public IFunction
 {
 public:
    static constexpr auto name = Name::name;
    static FunctionPtr create(const Context &) { return std::make_shared<FunctionsStringSearchToString>(); }
    String getName() const override { return name; }
    size_t getNumberOfArguments() const override { return 2; }
    bool useDefaultImplementationForConstants() const override { return true; }
    ColumnNumbers getArgumentsThatAreAlwaysConstant() const override { return {1}; }
    DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
    {
        if (!isString(arguments[0]))
            throw Exception(
                "Illegal type " + arguments[0]->getName() + " of argument of function " + getName(), ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
        if (!isString(arguments[1]))
            throw Exception(
                "Illegal type " + arguments[1]->getName() + " of argument of function " + getName(), ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
        return std::make_shared<DataTypeString>();
    }
    void executeImpl(Block & block, const ColumnNumbers & arguments, size_t result, size_t /*input_rows_count*/) override
    {
        const ColumnPtr column = block.getByPosition(arguments[0]).column;
        const ColumnPtr column_needle = block.getByPosition(arguments[1]).column;
        const ColumnConst * col_needle = typeid_cast<const ColumnConst *>(&*column_needle);
        if (!col_needle)
            throw Exception("Second argument of function " + getName() + " must be constant string", ErrorCodes::ILLEGAL_COLUMN);
        if (const ColumnString * col = checkAndGetColumn<ColumnString>(column.get()))
        {
            auto col_res = ColumnString::create();
            ColumnString::Chars & vec_res = col_res->getChars();
            ColumnString::Offsets & offsets_res = col_res->getOffsets();
            Impl::vector(col->getChars(), col->getOffsets(), col_needle->getValue<String>(), vec_res, offsets_res);
            block.getByPosition(result).column = std::move(col_res);
        }
        else
            throw Exception(
                "Illegal column " + block.getByPosition(arguments[0]).column->getName() + " of argument of function " + getName(),
                ErrorCodes::ILLEGAL_COLUMN);
    }
 };
 }
--- a/dbms/src/Functions/HasTokenImpl.h
+++ b/dbms/src/Functions/HasTokenImpl.h
@ -0,0 +1,83 @@
 #pragma once
 #include <Columns/ColumnString.h>
 namespace DB
 {
 namespace ErrorCodes
 {
    extern const int ILLEGAL_COLUMN;
 }
 /** Token search the string, means that needle must be surrounded by some separator chars, like whitespace or puctuation.
  */
 template <typename TokenSearcher, bool negate_result = false>
 struct HasTokenImpl
 {
    using ResultType = UInt8;
    static constexpr bool use_default_implementation_for_constants = true;
    static void vectorConstant(
        const ColumnString::Chars & data, const ColumnString::Offsets & offsets, const std::string & pattern, PaddedPODArray<UInt8> & res)
    {
        if (offsets.empty())
            return;
        const UInt8 * begin = data.data();
        const UInt8 * pos = begin;
        const UInt8 * end = pos + data.size();
        /// The current index in the array of strings.
        size_t i = 0;
        TokenSearcher searcher(pattern.data(), pattern.size(), end - pos);
        /// We will search for the next occurrence in all rows at once.
        while (pos < end && end != (pos = searcher.search(pos, end - pos)))
        {
            /// Let's determine which index it refers to.
            while (begin + offsets[i] <= pos)
            {
                res[i] = negate_result;
                ++i;
            }
            /// We check that the entry does not pass through the boundaries of strings.
            if (pos + pattern.size() < begin + offsets[i])
                res[i] = !negate_result;
            else
                res[i] = negate_result;
            pos = begin + offsets[i];
            ++i;
        }
        /// Tail, in which there can be no substring.
        if (i < res.size())
            memset(&res[i], negate_result, (res.size() - i) * sizeof(res[0]));
    }
    template <typename... Args>
    static void vectorVector(Args &&...)
    {
        throw Exception("Function 'hasToken' does not support non-constant needle argument", ErrorCodes::ILLEGAL_COLUMN);
    }
    /// Search different needles in single haystack.
    template <typename... Args>
    static void constantVector(Args &&...)
    {
        throw Exception("Function 'hasToken' does not support non-constant needle argument", ErrorCodes::ILLEGAL_COLUMN);
    }
    template <typename... Args>
    static void vectorFixedConstant(Args &&...)
    {
        throw Exception("Functions 'hasToken' don't support FixedString haystack argument", ErrorCodes::ILLEGAL_COLUMN);
    }
 };
 }
--- a/dbms/src/Functions/MultiSearchAllPositionsImpl.h
+++ b/dbms/src/Functions/MultiSearchAllPositionsImpl.h
@ -0,0 +1,48 @@
 #pragma once
 #include <vector>
 #include <Columns/ColumnString.h>
 namespace DB
 {
 template <typename Impl>
 struct MultiSearchAllPositionsImpl
 {
    using ResultType = UInt64;
    static void vectorConstant(
        const ColumnString::Chars & haystack_data,
        const ColumnString::Offsets & haystack_offsets,
        const std::vector<StringRef> & needles,
        PaddedPODArray<UInt64> & res)
    {
        auto res_callback = [](const UInt8 * start, const UInt8 * end) -> UInt64
        {
            return 1 + Impl::countChars(reinterpret_cast<const char *>(start), reinterpret_cast<const char *>(end));
        };
        auto searcher = Impl::createMultiSearcherInBigHaystack(needles);
        const size_t haystack_string_size = haystack_offsets.size();
        const size_t needles_size = needles.size();
        /// Something can be uninitialized after the search itself
        std::fill(res.begin(), res.end(), 0);
        while (searcher.hasMoreToSearch())
        {
            size_t prev_offset = 0;
            for (size_t j = 0, from = 0; j < haystack_string_size; ++j, from += needles_size)
            {
                const auto * haystack = &haystack_data[prev_offset];
                const auto * haystack_end = haystack + haystack_offsets[j] - prev_offset - 1;
                searcher.searchOneAll(haystack, haystack_end, res.data() + from, res_callback);
                prev_offset = haystack_offsets[j];
            }
        }
    }
 };
 }
--- a/dbms/src/Functions/MultiSearchFirstIndexImpl.h
+++ b/dbms/src/Functions/MultiSearchFirstIndexImpl.h
@ -0,0 +1,48 @@
 #pragma once
 #include <vector>
 #include <Columns/ColumnString.h>
 namespace DB
 {
 template <typename Impl>
 struct MultiSearchFirstIndexImpl
 {
    using ResultType = UInt64;
    static constexpr bool is_using_hyperscan = false;
    /// Variable for understanding, if we used offsets for the output, most
    /// likely to determine whether the function returns ColumnVector of ColumnArray.
    static constexpr bool is_column_array = false;
    static auto getReturnType() { return std::make_shared<DataTypeNumber<ResultType>>(); }
    static void vectorConstant(
        const ColumnString::Chars & haystack_data,
        const ColumnString::Offsets & haystack_offsets,
        const std::vector<StringRef> & needles,
        PaddedPODArray<UInt64> & res,
        [[maybe_unused]] PaddedPODArray<UInt64> & offsets)
    {
        auto searcher = Impl::createMultiSearcherInBigHaystack(needles);
        const size_t haystack_string_size = haystack_offsets.size();
        res.resize(haystack_string_size);
        size_t iteration = 0;
        while (searcher.hasMoreToSearch())
        {
            size_t prev_offset = 0;
            for (size_t j = 0; j < haystack_string_size; ++j)
            {
                const auto * haystack = &haystack_data[prev_offset];
                const auto * haystack_end = haystack + haystack_offsets[j] - prev_offset - 1;
                /// hasMoreToSearch traverse needles in increasing order
                if (iteration == 0 || res[j] == 0)
                    res[j] = searcher.searchOneFirstIndex(haystack, haystack_end);
                prev_offset = haystack_offsets[j];
            }
            ++iteration;
        }
    }
 };
 }
--- a/dbms/src/Functions/MultiSearchFirstPositionImpl.h
+++ b/dbms/src/Functions/MultiSearchFirstPositionImpl.h
@ -0,0 +1,57 @@
 #pragma once
 #include <vector>
 #include <Columns/ColumnString.h>
 namespace DB
 {
 template <typename Impl>
 struct MultiSearchFirstPositionImpl
 {
    using ResultType = UInt64;
    static constexpr bool is_using_hyperscan = false;
    /// Variable for understanding, if we used offsets for the output, most
    /// likely to determine whether the function returns ColumnVector of ColumnArray.
    static constexpr bool is_column_array = false;
    static auto getReturnType() { return std::make_shared<DataTypeNumber<ResultType>>(); }
    static void vectorConstant(
        const ColumnString::Chars & haystack_data,
        const ColumnString::Offsets & haystack_offsets,
        const std::vector<StringRef> & needles,
        PaddedPODArray<UInt64> & res,
        [[maybe_unused]] PaddedPODArray<UInt64> & offsets)
    {
        auto res_callback = [](const UInt8 * start, const UInt8 * end) -> UInt64
        {
            return 1 + Impl::countChars(reinterpret_cast<const char *>(start), reinterpret_cast<const char *>(end));
        };
        auto searcher = Impl::createMultiSearcherInBigHaystack(needles);
        const size_t haystack_string_size = haystack_offsets.size();
        res.resize(haystack_string_size);
        size_t iteration = 0;
        while (searcher.hasMoreToSearch())
        {
            size_t prev_offset = 0;
            for (size_t j = 0; j < haystack_string_size; ++j)
            {
                const auto * haystack = &haystack_data[prev_offset];
                const auto * haystack_end = haystack + haystack_offsets[j] - prev_offset - 1;
                if (iteration == 0 || res[j] == 0)
                    res[j] = searcher.searchOneFirstPosition(haystack, haystack_end, res_callback);
                else
                {
                    UInt64 result = searcher.searchOneFirstPosition(haystack, haystack_end, res_callback);
                    if (result != 0)
                        res[j] = std::min(result, res[j]);
                }
                prev_offset = haystack_offsets[j];
            }
            ++iteration;
        }
    }
 };
 }
--- a/dbms/src/Functions/MultiSearchImpl.h
+++ b/dbms/src/Functions/MultiSearchImpl.h
@ -0,0 +1,47 @@
 #pragma once
 #include <vector>
 #include <Columns/ColumnString.h>
 namespace DB
 {
 template <typename Impl>
 struct MultiSearchImpl
 {
    using ResultType = UInt8;
    static constexpr bool is_using_hyperscan = false;
    /// Variable for understanding, if we used offsets for the output, most
    /// likely to determine whether the function returns ColumnVector of ColumnArray.
    static constexpr bool is_column_array = false;
    static auto getReturnType() { return std::make_shared<DataTypeNumber<ResultType>>(); }
    static void vectorConstant(
        const ColumnString::Chars & haystack_data,
        const ColumnString::Offsets & haystack_offsets,
        const std::vector<StringRef> & needles,
        PaddedPODArray<UInt8> & res,
        [[maybe_unused]] PaddedPODArray<UInt64> & offsets)
    {
        auto searcher = Impl::createMultiSearcherInBigHaystack(needles);
        const size_t haystack_string_size = haystack_offsets.size();
        res.resize(haystack_string_size);
        size_t iteration = 0;
        while (searcher.hasMoreToSearch())
        {
            size_t prev_offset = 0;
            for (size_t j = 0; j < haystack_string_size; ++j)
            {
                const auto * haystack = &haystack_data[prev_offset];
                const auto * haystack_end = haystack + haystack_offsets[j] - prev_offset - 1;
                if (iteration == 0 || !res[j])
                    res[j] = searcher.searchOne(haystack, haystack_end);
                prev_offset = haystack_offsets[j];
            }
            ++iteration;
        }
    }
 };
 }
--- a/dbms/src/Functions/PositionImpl.h
+++ b/dbms/src/Functions/PositionImpl.h
@ -0,0 +1,307 @@
 #include "FunctionsStringSearch.h"
 #include <string>
 #include <vector>
 #include <Poco/UTF8String.h>
 #include <Common/Volnitsky.h>
 namespace DB
 {
 namespace ErrorCodes
 {
    extern const int ILLEGAL_COLUMN;
 }
 /** Implementation details for functions of 'position' family depending on ASCII/UTF8 and case sensitiveness.
  */
 struct PositionCaseSensitiveASCII
 {
    /// For searching single substring inside big-enough contiguous chunk of data. Coluld have slightly expensive initialization.
    using SearcherInBigHaystack = Volnitsky;
    /// For search many substrings in one string
    using MultiSearcherInBigHaystack = MultiVolnitsky;
    /// For searching single substring, that is different each time. This object is created for each row of data. It must have cheap initialization.
    using SearcherInSmallHaystack = LibCASCIICaseSensitiveStringSearcher;
    static SearcherInBigHaystack createSearcherInBigHaystack(const char * needle_data, size_t needle_size, size_t haystack_size_hint)
    {
        return SearcherInBigHaystack(needle_data, needle_size, haystack_size_hint);
    }
    static SearcherInSmallHaystack createSearcherInSmallHaystack(const char * needle_data, size_t needle_size)
    {
        return SearcherInSmallHaystack(needle_data, needle_size);
    }
    static MultiSearcherInBigHaystack createMultiSearcherInBigHaystack(const std::vector<StringRef> & needles)
    {
        return MultiSearcherInBigHaystack(needles);
    }
    /// Number of code points between 'begin' and 'end' (this has different behaviour for ASCII and UTF-8).
    static size_t countChars(const char * begin, const char * end) { return end - begin; }
    /// Convert string to lowercase. Only for case-insensitive search.
    /// Implementation is permitted to be inefficient because it is called for single string.
    static void toLowerIfNeed(std::string &) { }
 };
 struct PositionCaseInsensitiveASCII
 {
    /// `Volnitsky` is not used here, because one person has measured that this is better. It will be good if you question it.
    using SearcherInBigHaystack = ASCIICaseInsensitiveStringSearcher;
    using MultiSearcherInBigHaystack = MultiVolnitskyCaseInsensitive;
    using SearcherInSmallHaystack = LibCASCIICaseInsensitiveStringSearcher;
    static SearcherInBigHaystack createSearcherInBigHaystack(const char * needle_data, size_t needle_size, size_t /*haystack_size_hint*/)
    {
        return SearcherInBigHaystack(needle_data, needle_size);
    }
    static SearcherInSmallHaystack createSearcherInSmallHaystack(const char * needle_data, size_t needle_size)
    {
        return SearcherInSmallHaystack(needle_data, needle_size);
    }
    static MultiSearcherInBigHaystack createMultiSearcherInBigHaystack(const std::vector<StringRef> & needles)
    {
        return MultiSearcherInBigHaystack(needles);
    }
    static size_t countChars(const char * begin, const char * end) { return end - begin; }
    static void toLowerIfNeed(std::string & s) { std::transform(std::begin(s), std::end(s), std::begin(s), tolower); }
 };
 struct PositionCaseSensitiveUTF8
 {
    using SearcherInBigHaystack = VolnitskyUTF8;
    using MultiSearcherInBigHaystack = MultiVolnitskyUTF8;
    using SearcherInSmallHaystack = LibCASCIICaseSensitiveStringSearcher;
    static SearcherInBigHaystack createSearcherInBigHaystack(const char * needle_data, size_t needle_size, size_t haystack_size_hint)
    {
        return SearcherInBigHaystack(needle_data, needle_size, haystack_size_hint);
    }
    static SearcherInSmallHaystack createSearcherInSmallHaystack(const char * needle_data, size_t needle_size)
    {
        return SearcherInSmallHaystack(needle_data, needle_size);
    }
    static MultiSearcherInBigHaystack createMultiSearcherInBigHaystack(const std::vector<StringRef> & needles)
    {
        return MultiSearcherInBigHaystack(needles);
    }
    static size_t countChars(const char * begin, const char * end)
    {
        size_t res = 0;
        for (auto it = begin; it != end; ++it)
            if (!UTF8::isContinuationOctet(static_cast<UInt8>(*it)))
                ++res;
        return res;
    }
    static void toLowerIfNeed(std::string &) { }
 };
 struct PositionCaseInsensitiveUTF8
 {
    using SearcherInBigHaystack = VolnitskyCaseInsensitiveUTF8;
    using MultiSearcherInBigHaystack = MultiVolnitskyCaseInsensitiveUTF8;
    using SearcherInSmallHaystack = UTF8CaseInsensitiveStringSearcher; /// TODO Very suboptimal.
    static SearcherInBigHaystack createSearcherInBigHaystack(const char * needle_data, size_t needle_size, size_t haystack_size_hint)
    {
        return SearcherInBigHaystack(needle_data, needle_size, haystack_size_hint);
    }
    static SearcherInSmallHaystack createSearcherInSmallHaystack(const char * needle_data, size_t needle_size)
    {
        return SearcherInSmallHaystack(needle_data, needle_size);
    }
    static MultiSearcherInBigHaystack createMultiSearcherInBigHaystack(const std::vector<StringRef> & needles)
    {
        return MultiSearcherInBigHaystack(needles);
    }
    static size_t countChars(const char * begin, const char * end)
    {
        size_t res = 0;
        for (auto it = begin; it != end; ++it)
            if (!UTF8::isContinuationOctet(static_cast<UInt8>(*it)))
                ++res;
        return res;
    }
    static void toLowerIfNeed(std::string & s) { Poco::UTF8::toLowerInPlace(s); }
 };
 template <typename Impl>
 struct PositionImpl
 {
    static constexpr bool use_default_implementation_for_constants = false;
    using ResultType = UInt64;
    /// Find one substring in many strings.
    static void vectorConstant(
        const ColumnString::Chars & data, const ColumnString::Offsets & offsets, const std::string & needle, PaddedPODArray<UInt64> & res)
    {
        const UInt8 * begin = data.data();
        const UInt8 * pos = begin;
        const UInt8 * end = pos + data.size();
        /// Current index in the array of strings.
        size_t i = 0;
        typename Impl::SearcherInBigHaystack searcher = Impl::createSearcherInBigHaystack(needle.data(), needle.size(), end - pos);
        /// We will search for the next occurrence in all strings at once.
        while (pos < end && end != (pos = searcher.search(pos, end - pos)))
        {
            /// Determine which index it refers to.
            while (begin + offsets[i] <= pos)
            {
                res[i] = 0;
                ++i;
            }
            /// We check that the entry does not pass through the boundaries of strings.
            if (pos + needle.size() < begin + offsets[i])
                res[i] = 1 + Impl::countChars(reinterpret_cast<const char *>(begin + offsets[i - 1]), reinterpret_cast<const char *>(pos));
            else
                res[i] = 0;
            pos = begin + offsets[i];
            ++i;
        }
        if (i < res.size())
            memset(&res[i], 0, (res.size() - i) * sizeof(res[0]));
    }
    /// Search for substring in string.
    static void constantConstant(std::string data, std::string needle, UInt64 & res)
    {
        Impl::toLowerIfNeed(data);
        Impl::toLowerIfNeed(needle);
        res = data.find(needle);
        if (res == std::string::npos)
            res = 0;
        else
            res = 1 + Impl::countChars(data.data(), data.data() + res);
    }
    /// Search each time for a different single substring inside each time different string.
    static void vectorVector(
        const ColumnString::Chars & haystack_data,
        const ColumnString::Offsets & haystack_offsets,
        const ColumnString::Chars & needle_data,
        const ColumnString::Offsets & needle_offsets,
        PaddedPODArray<UInt64> & res)
    {
        ColumnString::Offset prev_haystack_offset = 0;
        ColumnString::Offset prev_needle_offset = 0;
        size_t size = haystack_offsets.size();
        for (size_t i = 0; i < size; ++i)
        {
            size_t needle_size = needle_offsets[i] - prev_needle_offset - 1;
            size_t haystack_size = haystack_offsets[i] - prev_haystack_offset - 1;
            if (0 == needle_size)
            {
                /// An empty string is always at the very beginning of `haystack`.
                res[i] = 1;
            }
            else
            {
                /// It is assumed that the StringSearcher is not very difficult to initialize.
                typename Impl::SearcherInSmallHaystack searcher = Impl::createSearcherInSmallHaystack(
                    reinterpret_cast<const char *>(&needle_data[prev_needle_offset]),
                    needle_offsets[i] - prev_needle_offset - 1); /// zero byte at the end
                /// searcher returns a pointer to the found substring or to the end of `haystack`.
                size_t pos = searcher.search(&haystack_data[prev_haystack_offset], &haystack_data[haystack_offsets[i] - 1])
                    - &haystack_data[prev_haystack_offset];
                if (pos != haystack_size)
                {
                    res[i] = 1
                        + Impl::countChars(
                                 reinterpret_cast<const char *>(&haystack_data[prev_haystack_offset]),
                                 reinterpret_cast<const char *>(&haystack_data[prev_haystack_offset + pos]));
                }
                else
                    res[i] = 0;
            }
            prev_haystack_offset = haystack_offsets[i];
            prev_needle_offset = needle_offsets[i];
        }
    }
    /// Find many substrings in single string.
    static void constantVector(
        const String & haystack,
        const ColumnString::Chars & needle_data,
        const ColumnString::Offsets & needle_offsets,
        PaddedPODArray<UInt64> & res)
    {
        // NOTE You could use haystack indexing. But this is a rare case.
        ColumnString::Offset prev_needle_offset = 0;
        size_t size = needle_offsets.size();
        for (size_t i = 0; i < size; ++i)
        {
            size_t needle_size = needle_offsets[i] - prev_needle_offset - 1;
            if (0 == needle_size)
            {
                res[i] = 1;
            }
            else
            {
                typename Impl::SearcherInSmallHaystack searcher = Impl::createSearcherInSmallHaystack(
                    reinterpret_cast<const char *>(&needle_data[prev_needle_offset]), needle_offsets[i] - prev_needle_offset - 1);
                size_t pos = searcher.search(
                                 reinterpret_cast<const UInt8 *>(haystack.data()),
                                 reinterpret_cast<const UInt8 *>(haystack.data()) + haystack.size())
                    - reinterpret_cast<const UInt8 *>(haystack.data());
                if (pos != haystack.size())
                {
                    res[i] = 1 + Impl::countChars(haystack.data(), haystack.data() + pos);
                }
                else
                    res[i] = 0;
            }
            prev_needle_offset = needle_offsets[i];
        }
    }
    template <typename... Args>
    static void vectorFixedConstant(Args &&...)
    {
        throw Exception("Functions 'position' don't support FixedString haystack argument", ErrorCodes::ILLEGAL_COLUMN);
    }
 };
 }
--- a/dbms/src/Functions/URL/cutURLParameter.cpp
+++ b/dbms/src/Functions/URL/cutURLParameter.cpp
@ -1,5 +1,5 @@
 #include <Functions/FunctionFactory.h>
-#include <Functions/FunctionsStringSearch.h>
+#include <Functions/FunctionsStringSearchToString.h>
 #include <common/find_symbols.h>
 namespace DB
--- a/dbms/src/Functions/URL/extractURLParameter.cpp
+++ b/dbms/src/Functions/URL/extractURLParameter.cpp
@ -1,5 +1,5 @@
 #include <Functions/FunctionFactory.h>
-#include <Functions/FunctionsStringSearch.h>
+#include <Functions/FunctionsStringSearchToString.h>
 #include <common/find_symbols.h>
 namespace DB
--- a/dbms/src/Functions/array/arrayReduce.cpp
+++ b/dbms/src/Functions/array/arrayReduce.cpp
@ -5,12 +5,10 @@
 #include <Columns/ColumnArray.h>
 #include <Columns/ColumnString.h>
 #include <Columns/ColumnAggregateFunction.h>
 #include <IO/WriteHelpers.h>
 #include <AggregateFunctions/AggregateFunctionFactory.h>
 #include <AggregateFunctions/AggregateFunctionState.h>
 #include <AggregateFunctions/IAggregateFunction.h>
 #include <AggregateFunctions/parseAggregateFunctionParameters.h>
 #include <Common/AlignedBuffer.h>
 #include <Common/Arena.h>
 #include <ext/scope_guard.h>
@ -108,7 +106,7 @@ DataTypePtr FunctionArrayReduce::getReturnTypeImpl(const ColumnsWithTypeAndName
 void FunctionArrayReduce::executeImpl(Block & block, const ColumnNumbers & arguments, size_t result, size_t input_rows_count)
 {
-    IAggregateFunction & agg_func = *aggregate_function.get();
+    IAggregateFunction & agg_func = *aggregate_function;
    std::unique_ptr<Arena> arena = std::make_unique<Arena>();
    /// Aggregate functions do not support constant columns. Therefore, we materialize them.
@ -132,7 +130,7 @@ void FunctionArrayReduce::executeImpl(Block & block, const ColumnNumbers & argum
        else if (const ColumnConst * const_arr = checkAndGetColumnConst<ColumnArray>(col))
        {
            materialized_columns.emplace_back(const_arr->convertToFullColumn());
-            const auto & materialized_arr = typeid_cast<const ColumnArray &>(*materialized_columns.back().get());
+            const auto & materialized_arr = typeid_cast<const ColumnArray &>(*materialized_columns.back());
            aggregate_arguments_vec[i] = &materialized_arr.getData();
            offsets_i = &materialized_arr.getOffsets();
        }
--- a/dbms/src/Functions/array/arrayReduceInRanges.cpp
+++ b/dbms/src/Functions/array/arrayReduceInRanges.cpp
@ -0,0 +1,394 @@
 #include <Functions/IFunctionImpl.h>
 #include <Functions/FunctionFactory.h>
 #include <Functions/FunctionHelpers.h>
 #include <DataTypes/DataTypeArray.h>
 #include <DataTypes/DataTypeTuple.h>
 #include <Columns/ColumnArray.h>
 #include <Columns/ColumnString.h>
 #include <Columns/ColumnTuple.h>
 #include <Columns/ColumnAggregateFunction.h>
 #include <AggregateFunctions/AggregateFunctionFactory.h>
 #include <AggregateFunctions/AggregateFunctionState.h>
 #include <AggregateFunctions/IAggregateFunction.h>
 #include <AggregateFunctions/parseAggregateFunctionParameters.h>
 #include <Common/Arena.h>
 #include <ext/scope_guard.h>
 namespace DB
 {
 namespace ErrorCodes
 {
    extern const int SIZES_OF_ARRAYS_DOESNT_MATCH;
    extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH;
    extern const int ILLEGAL_COLUMN;
    extern const int ILLEGAL_TYPE_OF_ARGUMENT;
    extern const int BAD_ARGUMENTS;
 }
 /** Applies an aggregate function to value ranges in the array.
  * The function does what arrayReduce do on a structure similar to segment tree.
  * Space complexity: n * log(n)
  *
  * arrayReduceInRanges('agg', indices, lengths, arr1, ...)
  */
 class FunctionArrayReduceInRanges : public IFunction
 {
 public:
    static const size_t minimum_step = 64;
    static constexpr auto name = "arrayReduceInRanges";
    static FunctionPtr create(const Context &) { return std::make_shared<FunctionArrayReduceInRanges>(); }
    String getName() const override { return name; }
    bool isVariadic() const override { return true; }
    size_t getNumberOfArguments() const override { return 0; }
    bool useDefaultImplementationForConstants() const override { return true; }
    ColumnNumbers getArgumentsThatAreAlwaysConstant() const override { return {0}; }
    DataTypePtr getReturnTypeImpl(const ColumnsWithTypeAndName & arguments) const override;
    void executeImpl(Block & block, const ColumnNumbers & arguments, size_t result, size_t input_rows_count) override;
 private:
    /// lazy initialization in getReturnTypeImpl
    /// TODO: init in OverloadResolver
    mutable AggregateFunctionPtr aggregate_function;
 };
 DataTypePtr FunctionArrayReduceInRanges::getReturnTypeImpl(const ColumnsWithTypeAndName & arguments) const
 {
    /// The first argument is a constant string with the name of the aggregate function
    ///  (possibly with parameters in parentheses, for example: "quantile(0.99)").
    if (arguments.size() < 3)
        throw Exception("Number of arguments for function " + getName() + " doesn't match: passed "
            + toString(arguments.size()) + ", should be at least 3.",
            ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH);
    const ColumnConst * aggregate_function_name_column = checkAndGetColumnConst<ColumnString>(arguments[0].column.get());
    if (!aggregate_function_name_column)
        throw Exception("First argument for function " + getName() + " must be constant string: name of aggregate function.",
            ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
    const DataTypeArray * ranges_type_array = checkAndGetDataType<DataTypeArray>(arguments[1].type.get());
    if (!ranges_type_array)
        throw Exception("Second argument for function " + getName() + " must be an array of ranges.",
            ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
    const DataTypeTuple * ranges_type_tuple = checkAndGetDataType<DataTypeTuple>(ranges_type_array->getNestedType().get());
    if (!ranges_type_tuple || ranges_type_tuple->getElements().size() != 2)
        throw Exception("Each array element in the second argument for function " + getName() + " must be a tuple (index, length).",
            ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
    if (!isNativeInteger(ranges_type_tuple->getElements()[0]))
        throw Exception("First tuple member in the second argument for function " + getName() + " must be ints or uints.",
            ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
    if (!WhichDataType(ranges_type_tuple->getElements()[1]).isNativeUInt())
        throw Exception("Second tuple member in the second argument for function " + getName() + " must be uints.",
            ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
    DataTypes argument_types(arguments.size() - 2);
    for (size_t i = 2, size = arguments.size(); i < size; ++i)
    {
        const DataTypeArray * arg = checkAndGetDataType<DataTypeArray>(arguments[i].type.get());
        if (!arg)
            throw Exception("Argument " + toString(i) + " for function " + getName() + " must be an array but it has type "
                + arguments[i].type->getName() + ".", ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
        argument_types[i - 2] = arg->getNestedType();
    }
    if (!aggregate_function)
    {
        String aggregate_function_name_with_params = aggregate_function_name_column->getValue<String>();
        if (aggregate_function_name_with_params.empty())
            throw Exception("First argument for function " + getName() + " (name of aggregate function) cannot be empty.",
                ErrorCodes::BAD_ARGUMENTS);
        String aggregate_function_name;
        Array params_row;
        getAggregateFunctionNameAndParametersArray(aggregate_function_name_with_params,
                                                   aggregate_function_name, params_row, "function " + getName());
        aggregate_function = AggregateFunctionFactory::instance().get(aggregate_function_name, argument_types, params_row);
    }
    return std::make_shared<DataTypeArray>(aggregate_function->getReturnType());
 }
 void FunctionArrayReduceInRanges::executeImpl(Block & block, const ColumnNumbers & arguments, size_t result, size_t input_rows_count)
 {
    IAggregateFunction & agg_func = *aggregate_function;
    std::unique_ptr<Arena> arena = std::make_unique<Arena>();
    /// Aggregate functions do not support constant columns. Therefore, we materialize them.
    std::vector<ColumnPtr> materialized_columns;
    /// Handling ranges
    const IColumn * ranges_col_array = block.getByPosition(arguments[1]).column.get();
    const IColumn * ranges_col_tuple = nullptr;
    const ColumnArray::Offsets * ranges_offsets = nullptr;
    if (const ColumnArray * arr = checkAndGetColumn<ColumnArray>(ranges_col_array))
    {
        ranges_col_tuple = &arr->getData();
        ranges_offsets = &arr->getOffsets();
    }
    else if (const ColumnConst * const_arr = checkAndGetColumnConst<ColumnArray>(ranges_col_array))
    {
        materialized_columns.emplace_back(const_arr->convertToFullColumn());
        const auto & materialized_arr = typeid_cast<const ColumnArray &>(*materialized_columns.back());
        ranges_col_tuple = &materialized_arr.getData();
        ranges_offsets = &materialized_arr.getOffsets();
    }
    else
        throw Exception("Illegal column " + ranges_col_array->getName() + " as argument of function " + getName(), ErrorCodes::ILLEGAL_COLUMN);
    const IColumn & indices_col = static_cast<const ColumnTuple *>(ranges_col_tuple)->getColumn(0);
    const IColumn & lengths_col = static_cast<const ColumnTuple *>(ranges_col_tuple)->getColumn(1);
    /// Handling arguments
    /// The code is mostly copied from `arrayReduce`. Maybe create a utility header?
    const size_t num_arguments_columns = arguments.size() - 2;
    std::vector<const IColumn *> aggregate_arguments_vec(num_arguments_columns);
    const ColumnArray::Offsets * offsets = nullptr;
    for (size_t i = 0; i < num_arguments_columns; ++i)
    {
        const IColumn * col = block.getByPosition(arguments[i + 2]).column.get();
        const ColumnArray::Offsets * offsets_i = nullptr;
        if (const ColumnArray * arr = checkAndGetColumn<ColumnArray>(col))
        {
            aggregate_arguments_vec[i] = &arr->getData();
            offsets_i = &arr->getOffsets();
        }
        else if (const ColumnConst * const_arr = checkAndGetColumnConst<ColumnArray>(col))
        {
            materialized_columns.emplace_back(const_arr->convertToFullColumn());
            const auto & materialized_arr = typeid_cast<const ColumnArray &>(*materialized_columns.back());
            aggregate_arguments_vec[i] = &materialized_arr.getData();
            offsets_i = &materialized_arr.getOffsets();
        }
        else
            throw Exception("Illegal column " + col->getName() + " as argument of function " + getName(), ErrorCodes::ILLEGAL_COLUMN);
        if (i == 0)
            offsets = offsets_i;
        else if (*offsets_i != *offsets)
            throw Exception("Lengths of all arrays passed to " + getName() + " must be equal.",
                ErrorCodes::SIZES_OF_ARRAYS_DOESNT_MATCH);
    }
    const IColumn ** aggregate_arguments = aggregate_arguments_vec.data();
    /// Handling results
    MutableColumnPtr result_holder = block.getByPosition(result).type->createColumn();
    ColumnArray * result_arr = static_cast<ColumnArray *>(result_holder.get());
    IColumn & result_data = result_arr->getData();
    result_arr->getOffsets().insert(ranges_offsets->begin(), ranges_offsets->end());
    /// AggregateFunction's states should be inserted into column using specific way
    auto res_col_aggregate_function = typeid_cast<ColumnAggregateFunction *>(&result_data);
    if (!res_col_aggregate_function && agg_func.isState())
        throw Exception("State function " + agg_func.getName() + " inserts results into non-state column "
                        + block.getByPosition(result).type->getName(), ErrorCodes::ILLEGAL_COLUMN);
    /// Perform the aggregation
    size_t begin = 0;
    size_t end = 0;
    size_t ranges_begin = 0;
    size_t ranges_end = 0;
    for (size_t i = 0; i < input_rows_count; ++i)
    {
        begin = end;
        end = (*offsets)[i];
        ranges_begin = ranges_end;
        ranges_end = (*ranges_offsets)[i];
        /// We will allocate pre-aggregation places for each `minimum_place << level` rows.
        /// The value of `level` starts from 0, and it will never exceed the number of bits in a `size_t`.
        /// We calculate the offset (and thus size) of those places in each level.
        size_t place_offsets[sizeof(size_t) * 8];
        size_t place_total = 0;
        {
            size_t place_in_level = (end - begin) / minimum_step;
            place_offsets[0] = place_in_level;
            for (size_t level = 0; place_in_level; ++level)
            {
                place_in_level >>= 1;
                place_total = place_offsets[level] + place_in_level;
                place_offsets[level + 1] = place_total;
            }
        }
        PODArray<AggregateDataPtr> places(place_total);
        for (size_t j = 0; j < place_total; ++j)
        {
            places[j] = arena->alignedAlloc(agg_func.sizeOfData(), agg_func.alignOfData());
            try
            {
                agg_func.create(places[j]);
            }
            catch (...)
            {
                for (size_t k = 0; k < j; ++k)
                    agg_func.destroy(places[k]);
                throw;
            }
        }
        SCOPE_EXIT({
            for (size_t j = 0; j < place_total; ++j)
                agg_func.destroy(places[j]);
        });
        auto true_func = &agg_func;
        /// Unnest consecutive trailing -State combinators
        while (auto func = typeid_cast<AggregateFunctionState *>(true_func))
            true_func = func->getNestedFunction().get();
        /// Pre-aggregate to the initial level
        for (size_t j = 0; j < place_offsets[0]; ++j)
        {
            size_t local_begin = j * minimum_step;
            size_t local_end = (j + 1) * minimum_step;
            for (size_t k = local_begin; k < local_end; ++k)
                true_func->add(places[j], aggregate_arguments, begin + k, arena.get());
        }
        /// Pre-aggregate to the higher levels by merging
        {
            size_t place_in_level = place_offsets[0] >> 1;
            size_t place_begin = 0;
            for (size_t level = 0; place_in_level; ++level)
            {
                size_t next_place_begin = place_offsets[level];
                for (size_t j = 0; j < place_in_level; ++j)
                {
                    true_func->merge(places[next_place_begin + j], places[place_begin + (j << 1)], arena.get());
                    true_func->merge(places[next_place_begin + j], places[place_begin + (j << 1) + 1], arena.get());
                }
                place_in_level >>= 1;
                place_begin = next_place_begin;
            }
        }
        for (size_t j = ranges_begin; j < ranges_end; ++j)
        {
            size_t local_begin = 0;
            size_t local_end = 0;
            {
                Int64 index = indices_col.getInt(j);
                UInt64 length = lengths_col.getUInt(j);
                /// Keep the same as in arraySlice
                if (index > 0)
                {
                    local_begin = index - 1;
                    if (local_begin + length < end - begin)
                        local_end = local_begin + length;
                    else
                        local_end = end - begin;
                }
                else if (index < 0)
                {
                    if (end - begin + index > 0)
                        local_begin = end - begin + index;
                    else
                        local_begin = 0;
                    if (local_begin + length < end - begin)
                        local_end = local_begin + length;
                    else
                        local_end = end - begin;
                }
            }
            size_t place_begin = (local_begin + minimum_step - 1) / minimum_step;
            size_t place_end = local_end / minimum_step;
            AggregateDataPtr place = arena->alignedAlloc(agg_func.sizeOfData(), agg_func.alignOfData());
            agg_func.create(place);
            SCOPE_EXIT({
                agg_func.destroy(place);
            });
            if (place_begin < place_end)
            {
                /// In this case, we can use pre-aggregated data.
                /// Aggregate rows before
                for (size_t k = local_begin; k < place_begin * minimum_step; ++k)
                    true_func->add(place, aggregate_arguments, begin + k, arena.get());
                /// Aggregate using pre-aggretated data
                {
                    size_t level = 0;
                    size_t place_curr = place_begin;
                    while (place_curr < place_end)
                    {
                        while (((place_curr >> level) & 1) == 0 && place_curr + (2 << level) <= place_end)
                            level += 1;
                        while (place_curr + (1 << level) > place_end)
                            level -= 1;
                        size_t place_offset = 0;
                        if (level)
                            place_offset = place_offsets[level - 1];
                        true_func->merge(place, places[place_offset + (place_curr >> level)], arena.get());
                        place_curr += 1 << level;
                    }
                }
                /// Aggregate rows after
                for (size_t k = place_end * minimum_step; k < local_end; ++k)
                    true_func->add(place, aggregate_arguments, begin + k, arena.get());
            }
            else
            {
                /// In this case, we can not use pre-aggregated data.
                for (size_t k = local_begin; k < local_end; ++k)
                    true_func->add(place, aggregate_arguments, begin + k, arena.get());
            }
            if (!res_col_aggregate_function)
                agg_func.insertResultInto(place, result_data);
            else
                res_col_aggregate_function->insertFrom(place);
        }
    }
    block.getByPosition(result).column = std::move(result_holder);
 }
 void registerFunctionArrayReduceInRanges(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionArrayReduceInRanges>();
 }
 }
--- a/dbms/src/Functions/array/registerFunctionsArray.cpp
+++ b/dbms/src/Functions/array/registerFunctionsArray.cpp
@ -33,6 +33,7 @@ void registerFunctionArrayFlatten(FunctionFactory &);
 void registerFunctionArrayWithConstant(FunctionFactory &);
 void registerFunctionArrayZip(FunctionFactory &);
 void registerFunctionArrayAUC(FunctionFactory &);
 void registerFunctionArrayReduceInRanges(FunctionFactory &);
 void registerFunctionsArray(FunctionFactory & factory)
 {
@ -53,6 +54,7 @@ void registerFunctionsArray(FunctionFactory & factory)
    registerFunctionArraySlice(factory);
    registerFunctionArrayReverse(factory);
    registerFunctionArrayReduce(factory);
    registerFunctionArrayReduceInRanges(factory);
    registerFunctionRange(factory);
    registerFunctionsEmptyArray(factory);
    registerFunctionEmptyArrayToSingle(factory);
--- a/dbms/src/Functions/hasToken.cpp
+++ b/dbms/src/Functions/hasToken.cpp
@ -0,0 +1,22 @@
 #include "FunctionsStringSearch.h"
 #include <Functions/FunctionFactory.h>
 #include "HasTokenImpl.h"
 #include <Common/Volnitsky.h>
 namespace DB
 {
 struct NameHasToken
 {
    static constexpr auto name = "hasToken";
 };
 using FunctionHasToken = FunctionsStringSearch<HasTokenImpl<VolnitskyCaseSensitiveToken, false>, NameHasToken>;
 void registerFunctionHasToken(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionHasToken>();
 }
 }
--- a/dbms/src/Functions/hasTokenCaseInsensitive.cpp
+++ b/dbms/src/Functions/hasTokenCaseInsensitive.cpp
@ -0,0 +1,23 @@
 #include "FunctionsStringSearch.h"
 #include <Functions/FunctionFactory.h>
 #include "HasTokenImpl.h"
 #include <Common/Volnitsky.h>
 namespace DB
 {
 struct NameHasTokenCaseInsensitive
 {
    static constexpr auto name = "hasTokenCaseInsensitive";
 };
 using FunctionHasTokenCaseInsensitive
    = FunctionsStringSearch<HasTokenImpl<VolnitskyCaseInsensitiveToken, false>, NameHasTokenCaseInsensitive>;
 void registerFunctionHasTokenCaseInsensitive(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionHasTokenCaseInsensitive>();
 }
 }
--- a/dbms/src/Functions/multiSearchAllPositions.cpp
+++ b/dbms/src/Functions/multiSearchAllPositions.cpp
@ -0,0 +1,23 @@
 #include "FunctionsMultiStringPosition.h"
 #include "FunctionFactory.h"
 #include "MultiSearchAllPositionsImpl.h"
 #include "PositionImpl.h"
 namespace DB
 {
 struct NameMultiSearchAllPositions
 {
    static constexpr auto name = "multiSearchAllPositions";
 };
 using FunctionMultiSearchAllPositions
    = FunctionsMultiStringPosition<MultiSearchAllPositionsImpl<PositionCaseSensitiveASCII>, NameMultiSearchAllPositions>;
 void registerFunctionMultiSearchAllPositions(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionMultiSearchAllPositions>();
 }
 }
--- a/dbms/src/Functions/multiSearchAllPositionsCaseInsensitive.cpp
+++ b/dbms/src/Functions/multiSearchAllPositionsCaseInsensitive.cpp
@ -0,0 +1,23 @@
 #include "FunctionsMultiStringPosition.h"
 #include "FunctionFactory.h"
 #include "MultiSearchAllPositionsImpl.h"
 #include "PositionImpl.h"
 namespace DB
 {
 struct NameMultiSearchAllPositionsCaseInsensitive
 {
    static constexpr auto name = "multiSearchAllPositionsCaseInsensitive";
 };
 using FunctionMultiSearchAllPositionsCaseInsensitive
    = FunctionsMultiStringPosition<MultiSearchAllPositionsImpl<PositionCaseInsensitiveASCII>, NameMultiSearchAllPositionsCaseInsensitive>;
 void registerFunctionMultiSearchAllPositionsCaseInsensitive(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionMultiSearchAllPositionsCaseInsensitive>();
 }
 }
--- a/dbms/src/Functions/multiSearchAllPositionsCaseInsensitiveUTF8.cpp
+++ b/dbms/src/Functions/multiSearchAllPositionsCaseInsensitiveUTF8.cpp
@ -0,0 +1,24 @@
 #include "FunctionsMultiStringPosition.h"
 #include "FunctionFactory.h"
 #include "MultiSearchAllPositionsImpl.h"
 #include "PositionImpl.h"
 namespace DB
 {
 struct NameMultiSearchAllPositionsCaseInsensitiveUTF8
 {
    static constexpr auto name = "multiSearchAllPositionsCaseInsensitiveUTF8";
 };
 using FunctionMultiSearchAllPositionsCaseInsensitiveUTF8 = FunctionsMultiStringPosition<
    MultiSearchAllPositionsImpl<PositionCaseInsensitiveUTF8>,
    NameMultiSearchAllPositionsCaseInsensitiveUTF8>;
 void registerFunctionMultiSearchAllPositionsCaseInsensitiveUTF8(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionMultiSearchAllPositionsCaseInsensitiveUTF8>();
 }
 }
--- a/dbms/src/Functions/multiSearchAllPositionsUTF8.cpp
+++ b/dbms/src/Functions/multiSearchAllPositionsUTF8.cpp
@ -0,0 +1,23 @@
 #include "FunctionsMultiStringPosition.h"
 #include "FunctionFactory.h"
 #include "MultiSearchAllPositionsImpl.h"
 #include "PositionImpl.h"
 namespace DB
 {
 struct NameMultiSearchAllPositionsUTF8
 {
    static constexpr auto name = "multiSearchAllPositionsUTF8";
 };
 using FunctionMultiSearchAllPositionsUTF8
    = FunctionsMultiStringPosition<MultiSearchAllPositionsImpl<PositionCaseSensitiveUTF8>, NameMultiSearchAllPositionsUTF8>;
 void registerFunctionMultiSearchAllPositionsUTF8(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionMultiSearchAllPositionsUTF8>();
 }
 }
--- a/dbms/src/Functions/multiSearchAny.cpp
+++ b/dbms/src/Functions/multiSearchAny.cpp
@ -0,0 +1,22 @@
 #include "FunctionsMultiStringSearch.h"
 #include "FunctionFactory.h"
 #include "MultiSearchImpl.h"
 #include "PositionImpl.h"
 namespace DB
 {
 struct NameMultiSearchAny
 {
    static constexpr auto name = "multiSearchAny";
 };
 using FunctionMultiSearch = FunctionsMultiStringSearch<MultiSearchImpl<PositionCaseSensitiveASCII>, NameMultiSearchAny>;
 void registerFunctionMultiSearchAny(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionMultiSearch>();
 }
 }
--- a/dbms/src/Functions/multiSearchAnyCaseInsensitive.cpp
+++ b/dbms/src/Functions/multiSearchAnyCaseInsensitive.cpp
@ -0,0 +1,22 @@
 #include "FunctionsMultiStringSearch.h"
 #include "FunctionFactory.h"
 #include "MultiSearchImpl.h"
 #include "PositionImpl.h"
 namespace DB
 {
 struct NameMultiSearchAnyCaseInsensitive
 {
    static constexpr auto name = "multiSearchAnyCaseInsensitive";
 };
 using FunctionMultiSearchCaseInsensitive
    = FunctionsMultiStringSearch<MultiSearchImpl<PositionCaseInsensitiveASCII>, NameMultiSearchAnyCaseInsensitive>;
 void registerFunctionMultiSearchAnyCaseInsensitive(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionMultiSearchCaseInsensitive>();
 }
 }
--- a/dbms/src/Functions/multiSearchAnyCaseInsensitiveUTF8.cpp
+++ b/dbms/src/Functions/multiSearchAnyCaseInsensitiveUTF8.cpp
@ -0,0 +1,23 @@
 #include "FunctionsMultiStringSearch.h"
 #include "FunctionFactory.h"
 #include "MultiSearchImpl.h"
 #include "PositionImpl.h"
 namespace DB
 {
 struct NameMultiSearchAnyCaseInsensitiveUTF8
 {
    static constexpr auto name = "multiSearchAnyCaseInsensitiveUTF8";
 };
 using FunctionMultiSearchCaseInsensitiveUTF8
    = FunctionsMultiStringSearch<MultiSearchImpl<PositionCaseInsensitiveUTF8>, NameMultiSearchAnyCaseInsensitiveUTF8>;
 void registerFunctionMultiSearchAnyCaseInsensitiveUTF8(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionMultiSearchCaseInsensitiveUTF8>();
 }
 }
--- a/dbms/src/Functions/multiSearchAnyUTF8.cpp
+++ b/dbms/src/Functions/multiSearchAnyUTF8.cpp
@ -0,0 +1,21 @@
 #include "FunctionsMultiStringSearch.h"
 #include "FunctionFactory.h"
 #include "MultiSearchImpl.h"
 #include "PositionImpl.h"
 namespace DB
 {
 struct NameMultiSearchAnyUTF8
 {
    static constexpr auto name = "multiSearchAnyUTF8";
 };
 using FunctionMultiSearchUTF8 = FunctionsMultiStringSearch<MultiSearchImpl<PositionCaseSensitiveUTF8>, NameMultiSearchAnyUTF8>;
 void registerFunctionMultiSearchAnyUTF8(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionMultiSearchUTF8>();
 }
 }
--- a/dbms/src/Functions/multiSearchFirstIndex.cpp
+++ b/dbms/src/Functions/multiSearchFirstIndex.cpp
@ -0,0 +1,23 @@
 #include "FunctionsMultiStringSearch.h"
 #include "FunctionFactory.h"
 #include "MultiSearchFirstIndexImpl.h"
 #include "PositionImpl.h"
 namespace DB
 {
 struct NameMultiSearchFirstIndex
 {
    static constexpr auto name = "multiSearchFirstIndex";
 };
 using FunctionMultiSearchFirstIndex
    = FunctionsMultiStringSearch<MultiSearchFirstIndexImpl<PositionCaseSensitiveASCII>, NameMultiSearchFirstIndex>;
 void registerFunctionMultiSearchFirstIndex(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionMultiSearchFirstIndex>();
 }
 }
--- a/dbms/src/Functions/multiSearchFirstIndexCaseInsensitive.cpp
+++ b/dbms/src/Functions/multiSearchFirstIndexCaseInsensitive.cpp
@ -0,0 +1,23 @@
 #include "FunctionsMultiStringSearch.h"
 #include "FunctionFactory.h"
 #include "MultiSearchFirstIndexImpl.h"
 #include "PositionImpl.h"
 namespace DB
 {
 struct NameMultiSearchFirstIndexCaseInsensitive
 {
    static constexpr auto name = "multiSearchFirstIndexCaseInsensitive";
 };
 using FunctionMultiSearchFirstIndexCaseInsensitive
    = FunctionsMultiStringSearch<MultiSearchFirstIndexImpl<PositionCaseInsensitiveASCII>, NameMultiSearchFirstIndexCaseInsensitive>;
 void registerFunctionMultiSearchFirstIndexCaseInsensitive(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionMultiSearchFirstIndexCaseInsensitive>();
 }
 }
--- a/dbms/src/Functions/multiSearchFirstIndexCaseInsensitiveUTF8.cpp
+++ b/dbms/src/Functions/multiSearchFirstIndexCaseInsensitiveUTF8.cpp
@ -0,0 +1,23 @@
 #include "FunctionsMultiStringSearch.h"
 #include "FunctionFactory.h"
 #include "MultiSearchFirstIndexImpl.h"
 #include "PositionImpl.h"
 namespace DB
 {
 struct NameMultiSearchFirstIndexCaseInsensitiveUTF8
 {
    static constexpr auto name = "multiSearchFirstIndexCaseInsensitiveUTF8";
 };
 using FunctionMultiSearchFirstIndexCaseInsensitiveUTF8
    = FunctionsMultiStringSearch<MultiSearchFirstIndexImpl<PositionCaseInsensitiveUTF8>, NameMultiSearchFirstIndexCaseInsensitiveUTF8>;
 void registerFunctionMultiSearchFirstIndexCaseInsensitiveUTF8(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionMultiSearchFirstIndexCaseInsensitiveUTF8>();
 }
 }
--- a/dbms/src/Functions/multiSearchFirstIndexUTF8.cpp
+++ b/dbms/src/Functions/multiSearchFirstIndexUTF8.cpp
@ -0,0 +1,23 @@
 #include "FunctionsMultiStringSearch.h"
 #include "FunctionFactory.h"
 #include "MultiSearchFirstIndexImpl.h"
 #include "PositionImpl.h"
 namespace DB
 {
 struct NameMultiSearchFirstIndexUTF8
 {
    static constexpr auto name = "multiSearchFirstIndexUTF8";
 };
 using FunctionMultiSearchFirstIndexUTF8
    = FunctionsMultiStringSearch<MultiSearchFirstIndexImpl<PositionCaseSensitiveUTF8>, NameMultiSearchFirstIndexUTF8>;
 void registerFunctionMultiSearchFirstIndexUTF8(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionMultiSearchFirstIndexUTF8>();
 }
 }
--- a/dbms/src/Functions/multiSearchFirstPosition.cpp
+++ b/dbms/src/Functions/multiSearchFirstPosition.cpp
@ -0,0 +1,23 @@
 #include "FunctionsMultiStringSearch.h"
 #include "FunctionFactory.h"
 #include "MultiSearchFirstPositionImpl.h"
 #include "PositionImpl.h"
 namespace DB
 {
 struct NameMultiSearchFirstPosition
 {
    static constexpr auto name = "multiSearchFirstPosition";
 };
 using FunctionMultiSearchFirstPosition
    = FunctionsMultiStringSearch<MultiSearchFirstPositionImpl<PositionCaseSensitiveASCII>, NameMultiSearchFirstPosition>;
 void registerFunctionMultiSearchFirstPosition(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionMultiSearchFirstPosition>();
 }
 }
--- a/dbms/src/Functions/multiSearchFirstPositionCaseInsensitive.cpp
+++ b/dbms/src/Functions/multiSearchFirstPositionCaseInsensitive.cpp
@ -0,0 +1,23 @@
 #include "FunctionsMultiStringSearch.h"
 #include "FunctionFactory.h"
 #include "MultiSearchFirstPositionImpl.h"
 #include "PositionImpl.h"
 namespace DB
 {
 struct NameMultiSearchFirstPositionCaseInsensitive
 {
    static constexpr auto name = "multiSearchFirstPositionCaseInsensitive";
 };
 using FunctionMultiSearchFirstPositionCaseInsensitive
    = FunctionsMultiStringSearch<MultiSearchFirstPositionImpl<PositionCaseInsensitiveASCII>, NameMultiSearchFirstPositionCaseInsensitive>;
 void registerFunctionMultiSearchFirstPositionCaseInsensitive(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionMultiSearchFirstPositionCaseInsensitive>();
 }
 }
--- a/dbms/src/Functions/multiSearchFirstPositionCaseInsensitiveUTF8.cpp
+++ b/dbms/src/Functions/multiSearchFirstPositionCaseInsensitiveUTF8.cpp
@ -0,0 +1,24 @@
 #include "FunctionsMultiStringSearch.h"
 #include "FunctionFactory.h"
 #include "MultiSearchFirstPositionImpl.h"
 #include "PositionImpl.h"
 namespace DB
 {
 struct NameMultiSearchFirstPositionCaseInsensitiveUTF8
 {
    static constexpr auto name = "multiSearchFirstPositionCaseInsensitiveUTF8";
 };
 using FunctionMultiSearchFirstPositionCaseInsensitiveUTF8 = FunctionsMultiStringSearch<
    MultiSearchFirstPositionImpl<PositionCaseInsensitiveUTF8>,
    NameMultiSearchFirstPositionCaseInsensitiveUTF8>;
 void registerFunctionMultiSearchFirstPositionCaseInsensitiveUTF8(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionMultiSearchFirstPositionCaseInsensitiveUTF8>();
 }
 }
--- a/dbms/src/Functions/multiSearchFirstPositionUTF8.cpp
+++ b/dbms/src/Functions/multiSearchFirstPositionUTF8.cpp
@ -0,0 +1,23 @@
 #include "FunctionsMultiStringSearch.h"
 #include "FunctionFactory.h"
 #include "MultiSearchFirstPositionImpl.h"
 #include "PositionImpl.h"
 namespace DB
 {
 struct NameMultiSearchFirstPositionUTF8
 {
    static constexpr auto name = "multiSearchFirstPositionUTF8";
 };
 using FunctionMultiSearchFirstPositionUTF8
    = FunctionsMultiStringSearch<MultiSearchFirstPositionImpl<PositionCaseSensitiveUTF8>, NameMultiSearchFirstPositionUTF8>;
 void registerFunctionMultiSearchFirstPositionUTF8(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionMultiSearchFirstPositionUTF8>();
 }
 }
--- a/dbms/src/Functions/position.cpp
+++ b/dbms/src/Functions/position.cpp
@ -0,0 +1,21 @@
 #include "FunctionsStringSearch.h"
 #include "FunctionFactory.h"
 #include "PositionImpl.h"
 namespace DB
 {
 struct NamePosition
 {
    static constexpr auto name = "position";
 };
 using FunctionPosition = FunctionsStringSearch<PositionImpl<PositionCaseSensitiveASCII>, NamePosition>;
 void registerFunctionPosition(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionPosition>(FunctionFactory::CaseInsensitive);
    factory.registerAlias("locate", NamePosition::name, FunctionFactory::CaseInsensitive);
 }
 }
--- a/dbms/src/Functions/positionCaseInsensitive.cpp
+++ b/dbms/src/Functions/positionCaseInsensitive.cpp
@ -0,0 +1,20 @@
 #include "FunctionsStringSearch.h"
 #include "FunctionFactory.h"
 #include "PositionImpl.h"
 namespace DB
 {
 struct NamePositionCaseInsensitive
 {
    static constexpr auto name = "positionCaseInsensitive";
 };
 using FunctionPositionCaseInsensitive = FunctionsStringSearch<PositionImpl<PositionCaseInsensitiveASCII>, NamePositionCaseInsensitive>;
 void registerFunctionPositionCaseInsensitive(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionPositionCaseInsensitive>();
 }
 }
--- a/dbms/src/Functions/positionCaseInsensitiveUTF8.cpp
+++ b/dbms/src/Functions/positionCaseInsensitiveUTF8.cpp
@ -0,0 +1,22 @@
 #include "FunctionsStringSearch.h"
 #include "FunctionFactory.h"
 #include "PositionImpl.h"
 namespace DB
 {
 struct NamePositionCaseInsensitiveUTF8
 {
    static constexpr auto name = "positionCaseInsensitiveUTF8";
 };
 using FunctionPositionCaseInsensitiveUTF8
    = FunctionsStringSearch<PositionImpl<PositionCaseInsensitiveUTF8>, NamePositionCaseInsensitiveUTF8>;
 void registerFunctionPositionCaseInsensitiveUTF8(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionPositionCaseInsensitiveUTF8>();
 }
 }
--- a/dbms/src/Functions/positionUTF8.cpp
+++ b/dbms/src/Functions/positionUTF8.cpp
@ -0,0 +1,21 @@
 #include "FunctionsStringSearch.h"
 #include "FunctionFactory.h"
 #include "PositionImpl.h"
 namespace DB
 {
 struct NamePositionUTF8
 {
    static constexpr auto name = "positionUTF8";
 };
 using FunctionPositionUTF8 = FunctionsStringSearch<PositionImpl<PositionCaseSensitiveUTF8>, NamePositionUTF8>;
 void registerFunctionPositionUTF8(FunctionFactory & factory)
 {
    factory.registerFunction<FunctionPositionUTF8>();
 }
 }
--- a/dbms/src/Functions/registerFunctionsStringSearch.cpp
+++ b/dbms/src/Functions/registerFunctionsStringSearch.cpp
@ -0,0 +1,66 @@
 namespace DB
 {
 class FunctionFactory;
 void registerFunctionPosition(FunctionFactory &);
 void registerFunctionPositionUTF8(FunctionFactory &);
 void registerFunctionPositionCaseInsensitive(FunctionFactory &);
 void registerFunctionPositionCaseInsensitiveUTF8(FunctionFactory &);
 void registerFunctionMultiSearchAny(FunctionFactory &);
 void registerFunctionMultiSearchAnyUTF8(FunctionFactory &);
 void registerFunctionMultiSearchAnyCaseInsensitive(FunctionFactory &);
 void registerFunctionMultiSearchAnyCaseInsensitiveUTF8(FunctionFactory &);
 void registerFunctionMultiSearchFirstIndex(FunctionFactory &);
 void registerFunctionMultiSearchFirstIndexUTF8(FunctionFactory &);
 void registerFunctionMultiSearchFirstIndexCaseInsensitive(FunctionFactory &);
 void registerFunctionMultiSearchFirstIndexCaseInsensitiveUTF8(FunctionFactory &);
 void registerFunctionMultiSearchFirstPosition(FunctionFactory &);
 void registerFunctionMultiSearchFirstPositionUTF8(FunctionFactory &);
 void registerFunctionMultiSearchFirstPositionCaseInsensitive(FunctionFactory &);
 void registerFunctionMultiSearchFirstPositionCaseInsensitiveUTF8(FunctionFactory &);
 void registerFunctionMultiSearchAllPositions(FunctionFactory &);
 void registerFunctionMultiSearchAllPositionsUTF8(FunctionFactory &);
 void registerFunctionMultiSearchAllPositionsCaseInsensitive(FunctionFactory &);
 void registerFunctionMultiSearchAllPositionsCaseInsensitiveUTF8(FunctionFactory &);
 void registerFunctionHasToken(FunctionFactory &);
 void registerFunctionHasTokenCaseInsensitive(FunctionFactory &);
 void registerFunctionsStringSearch(FunctionFactory & factory)
 {
    registerFunctionPosition(factory);
    registerFunctionPositionUTF8(factory);
    registerFunctionPositionCaseInsensitive(factory);
    registerFunctionPositionCaseInsensitiveUTF8(factory);
    registerFunctionMultiSearchAny(factory);
    registerFunctionMultiSearchAnyUTF8(factory);
    registerFunctionMultiSearchAnyCaseInsensitive(factory);
    registerFunctionMultiSearchAnyCaseInsensitiveUTF8(factory);
    registerFunctionMultiSearchFirstIndex(factory);
    registerFunctionMultiSearchFirstIndexUTF8(factory);
    registerFunctionMultiSearchFirstIndexCaseInsensitive(factory);
    registerFunctionMultiSearchFirstIndexCaseInsensitiveUTF8(factory);
    registerFunctionMultiSearchFirstPosition(factory);
    registerFunctionMultiSearchFirstPositionUTF8(factory);
    registerFunctionMultiSearchFirstPositionCaseInsensitive(factory);
    registerFunctionMultiSearchFirstPositionCaseInsensitiveUTF8(factory);
    registerFunctionMultiSearchAllPositions(factory);
    registerFunctionMultiSearchAllPositionsUTF8(factory);
    registerFunctionMultiSearchAllPositionsCaseInsensitive(factory);
    registerFunctionMultiSearchAllPositionsCaseInsensitiveUTF8(factory);
    registerFunctionHasToken(factory);
    registerFunctionHasTokenCaseInsensitive(factory);
 }
 }
--- a/dbms/src/Functions/visitParamExtractRaw.cpp
+++ b/dbms/src/Functions/visitParamExtractRaw.cpp
@ -1,6 +1,6 @@
 #include <Functions/FunctionFactory.h>
 #include <Functions/FunctionsVisitParam.h>
-#include <Functions/FunctionsStringSearch.h>
+#include <Functions/FunctionsStringSearchToString.h>
 namespace DB
--- a/dbms/src/Functions/visitParamExtractString.cpp
+++ b/dbms/src/Functions/visitParamExtractString.cpp
@ -1,6 +1,6 @@
 #include <Functions/FunctionFactory.h>
 #include <Functions/FunctionsVisitParam.h>
-#include <Functions/FunctionsStringSearch.h>
+#include <Functions/FunctionsStringSearchToString.h>
 namespace DB
--- a/dbms/src/Interpreters/ExpressionAnalyzer.cpp
+++ b/dbms/src/Interpreters/ExpressionAnalyzer.cpp
@ -24,7 +24,6 @@
 #include <Interpreters/ExpressionAnalyzer.h>
 #include <Interpreters/ExpressionActions.h>
 #include <Interpreters/InJoinSubqueriesPreprocessor.h>
 #include <Interpreters/LogicalExpressionsOptimizer.h>
 #include <Interpreters/ExternalDictionariesLoader.h>
 #include <Interpreters/Set.h>
--- a/dbms/src/Interpreters/InJoinSubqueriesPreprocessor.cpp
+++ b/dbms/src/Interpreters/InJoinSubqueriesPreprocessor.cpp
@ -38,6 +38,7 @@ struct NonGlobalTableData
    const CheckShardsAndTables & checker;
    const Context & context;
    std::vector<ASTPtr> & renamed_tables;
    ASTFunction * function = nullptr;
    ASTTableJoin * table_join = nullptr;
@ -95,10 +96,11 @@ private:
            String alias = database_and_table->tryGetAlias();
            if (alias.empty())
-                throw Exception("Distributed table should have an alias when distributed_product_mode set to local.",
+                throw Exception("Distributed table should have an alias when distributed_product_mode set to local",
                                ErrorCodes::DISTRIBUTED_IN_JOIN_SUBQUERY_DENIED);
            auto & identifier = database_and_table->as<ASTIdentifier &>();
            renamed_tables.emplace_back(identifier.clone());
            identifier.resetTable(database, table);
        }
        else
@ -118,6 +120,7 @@ public:
    {
        const CheckShardsAndTables & checker;
        const Context & context;
        std::vector<std::pair<ASTPtr, std::vector<ASTPtr>>> & renamed_tables;
    };
    static void visit(ASTPtr & node, Data & data)
@ -148,8 +151,11 @@ private:
        if (node.name == "in" || node.name == "notIn")
        {
            auto & subquery = node.arguments->children.at(1);
-            NonGlobalTableVisitor::Data table_data{data.checker, data.context, &node, nullptr};
+            std::vector<ASTPtr> renamed;
            NonGlobalTableVisitor::Data table_data{data.checker, data.context, renamed, &node, nullptr};
            NonGlobalTableVisitor(table_data).visit(subquery);
            if (!renamed.empty())
                data.renamed_tables.emplace_back(subquery, std::move(renamed));
        }
    }
@ -163,8 +169,11 @@ private:
        {
            if (auto & subquery = node.table_expression->as<ASTTableExpression>()->subquery)
            {
-                NonGlobalTableVisitor::Data table_data{data.checker, data.context, nullptr, table_join};
+                std::vector<ASTPtr> renamed;
                NonGlobalTableVisitor::Data table_data{data.checker, data.context, renamed, nullptr, table_join};
                NonGlobalTableVisitor(table_data).visit(subquery);
                if (!renamed.empty())
                    data.renamed_tables.emplace_back(subquery, std::move(renamed));
            }
        }
    }
@ -208,7 +217,7 @@ void InJoinSubqueriesPreprocessor::visit(ASTPtr & ast) const
            return;
    }
-    NonGlobalSubqueryVisitor::Data visitor_data{*checker, context};
+    NonGlobalSubqueryVisitor::Data visitor_data{*checker, context, renamed_tables};
    NonGlobalSubqueryVisitor(visitor_data).visit(ast);
 }
--- a/dbms/src/Interpreters/InJoinSubqueriesPreprocessor.h
+++ b/dbms/src/Interpreters/InJoinSubqueriesPreprocessor.h
@ -35,6 +35,8 @@ class Context;
 class InJoinSubqueriesPreprocessor
 {
 public:
    using SubqueryTables = std::vector<std::pair<ASTPtr, std::vector<ASTPtr>>>;  /// {subquery, renamed_tables}
    struct CheckShardsAndTables
    {
        using Ptr = std::unique_ptr<CheckShardsAndTables>;
@ -45,8 +47,10 @@ public:
        virtual ~CheckShardsAndTables() {}
    };
-    InJoinSubqueriesPreprocessor(const Context & context_, CheckShardsAndTables::Ptr _checker = std::make_unique<CheckShardsAndTables>())
+    InJoinSubqueriesPreprocessor(const Context & context_, SubqueryTables & renamed_tables_,
                                 CheckShardsAndTables::Ptr _checker = std::make_unique<CheckShardsAndTables>())
        : context(context_)
        , renamed_tables(renamed_tables_)
        , checker(std::move(_checker))
    {}
@ -54,6 +58,7 @@ public:
 private:
    const Context & context;
    SubqueryTables & renamed_tables;
    CheckShardsAndTables::Ptr checker;
 };
--- a/dbms/src/Interpreters/InterpreterAlterQuery.cpp
+++ b/dbms/src/Interpreters/InterpreterAlterQuery.cpp
@ -82,7 +82,7 @@ BlockIO InterpreterAlterQuery::execute()
    if (!mutation_commands.empty())
    {
-        auto table_lock_holder = table->lockStructureForShare(false /* because mutation is executed asyncronously */, context.getCurrentQueryId());
+        auto table_lock_holder = table->lockStructureForShare(context.getCurrentQueryId());
        MutationsInterpreter(table, mutation_commands, context, false).validate(table_lock_holder);
        table->mutate(mutation_commands, context);
    }
@ -101,7 +101,7 @@ BlockIO InterpreterAlterQuery::execute()
            switch (command.type)
            {
                case LiveViewCommand::REFRESH:
-                    live_view->refresh(context);
+                    live_view->refresh();
                    break;
            }
        }
@ -109,7 +109,7 @@ BlockIO InterpreterAlterQuery::execute()
    if (!alter_commands.empty())
    {
-        auto table_lock_holder = table->lockAlterIntention(context.getCurrentQueryId());
+        auto table_lock_holder = table->lockAlterIntention();
        StorageInMemoryMetadata metadata = table->getInMemoryMetadata();
        alter_commands.validate(metadata, context);
        alter_commands.prepare(metadata);
--- a/dbms/src/Interpreters/InterpreterCreateQuery.cpp
+++ b/dbms/src/Interpreters/InterpreterCreateQuery.cpp
@ -411,7 +411,7 @@ InterpreterCreateQuery::TableProperties InterpreterCreateQuery::setProperties(AS
        StoragePtr as_storage = DatabaseCatalog::instance().getTable({as_database_name, create.as_table});
        /// as_storage->getColumns() and setEngine(...) must be called under structure lock of other_table for CREATE ... AS other_table.
-        as_storage_lock = as_storage->lockStructureForShare(false, context.getCurrentQueryId());
+        as_storage_lock = as_storage->lockStructureForShare(context.getCurrentQueryId());
        properties.columns = as_storage->getColumns();
        /// Secondary indices make sense only for MergeTree family of storage engines.
--- a/dbms/src/Interpreters/InterpreterDescribeQuery.cpp
+++ b/dbms/src/Interpreters/InterpreterDescribeQuery.cpp
@ -89,7 +89,7 @@ BlockInputStreamPtr InterpreterDescribeQuery::executeImpl()
            table = DatabaseCatalog::instance().getTable(table_id);
        }
-        auto table_lock = table->lockStructureForShare(false, context.getInitialQueryId());
+        auto table_lock = table->lockStructureForShare(context.getInitialQueryId());
        columns = table->getColumns();
    }
--- a/dbms/src/Interpreters/InterpreterInsertQuery.cpp
+++ b/dbms/src/Interpreters/InterpreterInsertQuery.cpp
@ -109,7 +109,7 @@ BlockIO InterpreterInsertQuery::execute()
    BlockIO res;
    StoragePtr table = getTable(query);
-    auto table_lock = table->lockStructureForShare(true, context.getInitialQueryId());
+    auto table_lock = table->lockStructureForShare(context.getInitialQueryId());
    auto query_sample_block = getSampleBlock(query, table);
    if (!query.table_function)
--- a/dbms/src/Interpreters/InterpreterSelectQuery.cpp
+++ b/dbms/src/Interpreters/InterpreterSelectQuery.cpp
@ -255,7 +255,7 @@ InterpreterSelectQuery::InterpreterSelectQuery(
    if (storage)
    {
-        table_lock = storage->lockStructureForShare(false, context->getInitialQueryId());
+        table_lock = storage->lockStructureForShare(context->getInitialQueryId());
        table_id = storage->getStorageID();
    }
@ -301,6 +301,8 @@ InterpreterSelectQuery::InterpreterSelectQuery(
            source_header = interpreter_subquery->getSampleBlock();
    }
    joined_tables.rewriteDistributedInAndJoins(query_ptr);
    max_streams = settings.max_threads;
    ASTSelectQuery & query = getSelectQuery();
@ -508,7 +510,7 @@ Block InterpreterSelectQuery::getSampleBlockImpl(bool try_move_to_prewhere)
    }
    if (storage && !options.only_analyze)
-        from_stage = storage->getQueryProcessingStage(*context);
+        from_stage = storage->getQueryProcessingStage(*context, query_ptr);
    /// Do I need to perform the first part of the pipeline - running on remote servers during distributed processing.
    bool first_stage = from_stage < QueryProcessingStage::WithMergeableState
@ -1062,7 +1064,7 @@ void InterpreterSelectQuery::executeFetchColumns(
    auto check_trivial_count_query = [&]() -> std::optional<AggregateDescription>
    {
        if (!settings.optimize_trivial_count_query || !syntax_analyzer_result->maybe_optimize_trivial_count || !storage
-            || query.sampleSize() || query.sampleOffset() || query.final() || query.prewhere() || query.where()
+            || query.sampleSize() || query.sampleOffset() || query.final() || query.prewhere() || query.where() || query.groupBy()
            || !query_analyzer->hasAggregation() || processing_stage != QueryProcessingStage::FetchColumns)
            return {};
--- a/dbms/src/Interpreters/JoinedTables.cpp
+++ b/dbms/src/Interpreters/JoinedTables.cpp
@ -1,12 +1,18 @@
 #include <Interpreters/JoinedTables.h>
 #include <Interpreters/Context.h>
 #include <Interpreters/getTableExpressions.h>
 #include <Interpreters/InJoinSubqueriesPreprocessor.h>
 #include <Interpreters/IdentifierSemantic.h>
 #include <Interpreters/InDepthNodeVisitor.h>
 #include <Storages/IStorage.h>
 #include <Storages/ColumnsDescription.h>
 #include <Storages/StorageValues.h>
 #include <Parsers/ASTFunction.h>
 #include <Parsers/ASTSelectWithUnionQuery.h>
 #include <Parsers/ASTSubquery.h>
 #include <Parsers/ASTTablesInSelectQuery.h>
 #include <Parsers/ASTIdentifier.h>
 #include <Parsers/ASTQualifiedAsterisk.h>
 namespace DB
 {
@ -14,6 +20,7 @@ namespace DB
 namespace ErrorCodes
 {
    extern const int ALIAS_REQUIRED;
    extern const int AMBIGUOUS_COLUMN_NAME;
 }
 namespace
@ -32,6 +39,71 @@ void checkTablesWithColumns(const std::vector<T> & tables_with_columns, const Co
    }
 }
 class RenameQualifiedIdentifiersMatcher
 {
 public:
    using Data = const std::vector<DatabaseAndTableWithAlias>;
    static void visit(ASTPtr & ast, Data & data)
    {
        if (auto * t = ast->as<ASTIdentifier>())
            visit(*t, ast, data);
        if (auto * node = ast->as<ASTQualifiedAsterisk>())
            visit(*node, ast, data);
    }
    static bool needChildVisit(ASTPtr & node, const ASTPtr & child)
    {
        if (node->as<ASTTableExpression>() ||
            node->as<ASTQualifiedAsterisk>() ||
            child->as<ASTSubquery>())
            return false; // NOLINT
        return true;
    }
 private:
    static void visit(ASTIdentifier & identifier, ASTPtr &, Data & data)
    {
        if (identifier.isShort())
            return;
        bool rewritten = false;
        for (auto & table : data)
        {
            /// Table has an alias. We do not need to rewrite qualified names with table alias (match == ColumnMatch::TableName).
            auto match = IdentifierSemantic::canReferColumnToTable(identifier, table);
            if (match == IdentifierSemantic::ColumnMatch::AliasedTableName ||
                match == IdentifierSemantic::ColumnMatch::DbAndTable)
            {
                if (rewritten)
                    throw Exception("Failed to rewrite distributed table names. Ambiguous column '" + identifier.name + "'",
                                    ErrorCodes::AMBIGUOUS_COLUMN_NAME);
                /// Table has an alias. So we set a new name qualified by table alias.
                IdentifierSemantic::setColumnLongName(identifier, table);
                rewritten = true;
            }
        }
    }
    static void visit(const ASTQualifiedAsterisk & node, const ASTPtr &, Data & data)
    {
        ASTIdentifier & identifier = *node.children[0]->as<ASTIdentifier>();
        bool rewritten = false;
        for (auto & table : data)
        {
            if (identifier.name == table.table)
            {
                if (rewritten)
                    throw Exception("Failed to rewrite distributed table. Ambiguous column '" + identifier.name + "'",
                                    ErrorCodes::AMBIGUOUS_COLUMN_NAME);
                identifier.setShortName(table.alias);
                rewritten = true;
            }
        }
    }
 };
 using RenameQualifiedIdentifiersVisitor = InDepthNodeVisitor<RenameQualifiedIdentifiersMatcher, true>;
 }
 JoinedTables::JoinedTables(Context && context_, const ASTSelectQuery & select_query)
@ -114,4 +186,27 @@ void JoinedTables::makeFakeTable(StoragePtr storage, const Block & source_header
        tables_with_columns.emplace_back(DatabaseAndTableWithAlias{}, source_header.getNamesAndTypesList());
 }
 void JoinedTables::rewriteDistributedInAndJoins(ASTPtr & query)
 {
    /// Rewrite IN and/or JOIN for distributed tables according to distributed_product_mode setting.
    InJoinSubqueriesPreprocessor::SubqueryTables renamed_tables;
    InJoinSubqueriesPreprocessor(context, renamed_tables).visit(query);
    String database;
    if (!renamed_tables.empty())
        database = context.getCurrentDatabase();
    for (auto & [subquery, ast_tables] : renamed_tables)
    {
        std::vector<DatabaseAndTableWithAlias> renamed;
        renamed.reserve(ast_tables.size());
        for (auto & ast : ast_tables)
            renamed.emplace_back(DatabaseAndTableWithAlias(*ast->as<ASTIdentifier>(), database));
        /// Change qualified column names in distributed subqueries using table aliases.
        RenameQualifiedIdentifiersVisitor::Data data(renamed);
        RenameQualifiedIdentifiersVisitor(data).visit(subquery);
    }
 }
 }
--- a/dbms/src/Interpreters/JoinedTables.h
+++ b/dbms/src/Interpreters/JoinedTables.h
@ -37,6 +37,8 @@ public:
    const StorageID & leftTableID() const { return table_id; }
    void rewriteDistributedInAndJoins(ASTPtr & query);
    std::unique_ptr<InterpreterSelectWithUnionQuery> makeLeftTableSubquery(const SelectQueryOptions & select_options);
 private:
--- a/dbms/src/Interpreters/MutationsInterpreter.cpp
+++ b/dbms/src/Interpreters/MutationsInterpreter.cpp
@ -558,6 +558,10 @@ ASTPtr MutationsInterpreter::prepareInterpreterSelectQuery(std::vector<Stage> &
            all_asts->children.push_back(std::make_shared<ASTIdentifier>(column));
        auto syntax_result = SyntaxAnalyzer(context).analyze(all_asts, all_columns);
        if (context.hasQueryContext())
            for (const auto & it : syntax_result->getScalars())
                context.getQueryContext().addScalar(it.first, it.second);
        stage.analyzer = std::make_unique<ExpressionAnalyzer>(all_asts, syntax_result, context);
        ExpressionActionsChain & actions_chain = stage.expressions_chain;
--- a/dbms/src/Interpreters/MutationsInterpreter.h
+++ b/dbms/src/Interpreters/MutationsInterpreter.h
@ -47,7 +47,7 @@ private:
    StoragePtr storage;
    MutationCommands commands;
-    const Context & context;
+    Context context;
    bool can_execute;
    ASTPtr mutation_ast;
--- a/dbms/src/Interpreters/SyntaxAnalyzer.cpp
+++ b/dbms/src/Interpreters/SyntaxAnalyzer.cpp
@ -2,7 +2,6 @@
 #include <Core/NamesAndTypes.h>
 #include <Interpreters/SyntaxAnalyzer.h>
 #include <Interpreters/InJoinSubqueriesPreprocessor.h>
 #include <Interpreters/LogicalExpressionsOptimizer.h>
 #include <Interpreters/QueryAliasesVisitor.h>
 #include <Interpreters/InterpreterSelectWithUnionQuery.h>
@ -819,9 +818,6 @@ SyntaxAnalyzerResultPtr SyntaxAnalyzer::analyzeSelect(
    translateQualifiedNames(query, *select_query, source_columns_set, tables_with_column_names);
    /// Rewrite IN and/or JOIN for distributed tables according to distributed_product_mode setting.
    InJoinSubqueriesPreprocessor(context).visit(query);
    /// Optimizes logical expressions.
    LogicalExpressionsOptimizer(select_query, settings.optimize_min_equality_disjunction_chain_length.value).perform();
--- a/dbms/src/Interpreters/SystemLog.cpp
+++ b/dbms/src/Interpreters/SystemLog.cpp
@ -57,7 +57,8 @@ std::shared_ptr<TSystemLog> createSystemLog(
    else
    {
        String partition_by = config.getString(config_prefix + ".partition_by", "toYYYYMM(event_date)");
-        engine = "ENGINE = MergeTree PARTITION BY (" + partition_by + ") ORDER BY (event_date, event_time) SETTINGS index_granularity = 1024";
+        engine = "ENGINE = MergeTree PARTITION BY (" + partition_by + ") ORDER BY (event_date, event_time)"
            "SETTINGS min_bytes_for_wide_part = '10M'"; /// Use polymorphic parts for log tables by default
    }
    size_t flush_interval_milliseconds = config.getUInt64(config_prefix + ".flush_interval_milliseconds", DEFAULT_SYSTEM_LOG_FLUSH_INTERVAL_MILLISECONDS);
--- a/dbms/src/Interpreters/evaluateConstantExpression.cpp
+++ b/dbms/src/Interpreters/evaluateConstantExpression.cpp
@ -101,9 +101,9 @@ namespace
    using Conjunction = ColumnsWithTypeAndName;
    using Disjunction = std::vector<Conjunction>;
-    Disjunction analyzeEquals(const ASTIdentifier * identifier, const ASTLiteral * literal, const ExpressionActionsPtr & expr)
+    Disjunction analyzeEquals(const ASTIdentifier * identifier, const Field & value, const ExpressionActionsPtr & expr)
    {
-        if (!identifier || !literal)
+        if (!identifier || value.isNull())
        {
            return {};
        }
@ -116,10 +116,10 @@ namespace
            if (name == identifier->name)
            {
                ColumnWithTypeAndName column;
-                Field value = convertFieldToType(literal->value, *type);
+                Field converted = convertFieldToType(value, *type);
-                if (!literal->value.isNull() && value.isNull())
+                if (converted.isNull())
                    return {};
-                column.column = type->createColumnConst(1, value);
+                column.column = type->createColumnConst(1, converted);
                column.name = name;
                column.type = type;
                return {{std::move(column)}};
@ -129,6 +129,16 @@ namespace
        return {};
    }
    Disjunction analyzeEquals(const ASTIdentifier * identifier, const ASTLiteral * literal, const ExpressionActionsPtr & expr)
    {
        if (!identifier || !literal)
        {
            return {};
        }
        return analyzeEquals(identifier, literal->value, expr);
    }
    Disjunction andDNF(const Disjunction & left, const Disjunction & right)
    {
        if (left.empty())
@ -174,33 +184,44 @@ namespace
            const auto * left = fn->arguments->children.front().get();
            const auto * right = fn->arguments->children.back().get();
            const auto * identifier = left->as<ASTIdentifier>();
            const auto * inner_fn = right->as<ASTFunction>();
            if (!inner_fn)
            {
                return {};
            }
            const auto * tuple = inner_fn->children.front()->as<ASTExpressionList>();
            if (!tuple)
            {
                return {};
            }
            Disjunction result;
-            for (const auto & child : tuple->children)
+            if (const auto * tuple_func = right->as<ASTFunction>(); tuple_func && tuple_func->name == "tuple")
            {
-                const auto * literal = child->as<ASTLiteral>();
+                const auto * tuple_elements = tuple_func->children.front()->as<ASTExpressionList>();
-                const auto dnf = analyzeEquals(identifier, literal, expr);
+                for (const auto & child : tuple_elements->children)
                if (dnf.empty())
                {
-                    return {};
+                    const auto * literal = child->as<ASTLiteral>();
-                }
+                    const auto dnf = analyzeEquals(identifier, literal, expr);
-                result.insert(result.end(), dnf.begin(), dnf.end());
+                    if (dnf.empty())
                    {
                        return {};
                    }
                    result.insert(result.end(), dnf.begin(), dnf.end());
                }
            }
            else if (const auto * tuple_literal = right->as<ASTLiteral>();
                tuple_literal && tuple_literal->value.getType() == Field::Types::Tuple)
            {
                const auto & tuple = tuple_literal->value.get<const Tuple &>();
                for (const auto & child : tuple)
                {
                    const auto dnf = analyzeEquals(identifier, child, expr);
                    if (dnf.empty())
                    {
                        return {};
                    }
                    result.insert(result.end(), dnf.begin(), dnf.end());
                }
            }
            else
            {
                return {};
            }
            return result;
--- a/dbms/src/Interpreters/executeQuery.cpp
+++ b/dbms/src/Interpreters/executeQuery.cpp
@ -41,6 +41,7 @@
 #include <Processors/Formats/IOutputFormat.h>
 #include <Parsers/ASTWatchQuery.h>
 namespace ProfileEvents
 {
    extern const Event QueryMaskingRulesMatch;
--- a/dbms/src/Interpreters/executeQuery.h
+++ b/dbms/src/Interpreters/executeQuery.h
@ -38,7 +38,7 @@ void executeQuery(
 /// Correctly formatting the results (according to INTO OUTFILE and FORMAT sections)
 /// must be done separately.
 BlockIO executeQuery(
-    const String & query,    /// Query text without INSERT data. The latter must be written to BlockIO::out.
+    const String & query,     /// Query text without INSERT data. The latter must be written to BlockIO::out.
    Context & context,        /// DB, tables, data types, storage engines, functions, aggregate functions...
    bool internal = false,    /// If true, this query is caused by another query and thus needn't be registered in the ProcessList.
    QueryProcessingStage::Enum stage = QueryProcessingStage::Complete,    /// To which stage the query must be executed.
@ -48,7 +48,7 @@ BlockIO executeQuery(
 QueryPipeline executeQueryWithProcessors(
-    const String & query,    /// Query text without INSERT data. The latter must be written to BlockIO::out.
+    const String & query,     /// Query text without INSERT data. The latter must be written to BlockIO::out.
    Context & context,        /// DB, tables, data types, storage engines, functions, aggregate functions...
    bool internal = false,    /// If true, this query is caused by another query and thus needn't be registered in the ProcessList.
    QueryProcessingStage::Enum stage = QueryProcessingStage::Complete,    /// To which stage the query must be executed.
--- a/dbms/src/Interpreters/tests/in_join_subqueries_preprocessor.cpp
+++ b/dbms/src/Interpreters/tests/in_join_subqueries_preprocessor.cpp
@ -1181,7 +1181,8 @@ TestResult check(const TestEntry & entry)
        try
        {
-            DB::InJoinSubqueriesPreprocessor(context, std::make_unique<CheckShardsAndTablesMock>()).visit(ast_input);
+            DB::InJoinSubqueriesPreprocessor::SubqueryTables renamed;
            DB::InJoinSubqueriesPreprocessor(context, renamed, std::make_unique<CheckShardsAndTablesMock>()).visit(ast_input);
        }
        catch (const DB::Exception & ex)
        {
--- a/dbms/src/Parsers/ASTLiteral.cpp
+++ b/dbms/src/Parsers/ASTLiteral.cpp
@ -16,17 +16,21 @@ void ASTLiteral::updateTreeHashImpl(SipHash & hash_state) const
 void ASTLiteral::appendColumnNameImpl(WriteBuffer & ostr) const
 {
-    /// Special case for very large arrays. Instead of listing all elements, will use hash of them.
+    /// 100 - just arbitrary value.
    constexpr auto min_elements_for_hashing = 100;
    /// Special case for very large arrays and tuples. Instead of listing all elements, will use hash of them.
    /// (Otherwise column name will be too long, that will lead to significant slowdown of expression analysis.)
-    if (value.getType() == Field::Types::Array
+    auto type = value.getType();
-        && value.get<const Array &>().size() > 100)        /// 100 - just arbitrary value.
+    if ((type == Field::Types::Array && value.get<const Array &>().size() > min_elements_for_hashing)
        || (type == Field::Types::Tuple && value.get<const Tuple &>().size() > min_elements_for_hashing))
    {
        SipHash hash;
        applyVisitor(FieldVisitorHash(hash), value);
        UInt64 low, high;
        hash.get128(low, high);
-        writeCString("__array_", ostr);
+        writeCString(type == Field::Types::Array ? "__array_" : "__tuple_", ostr);
        writeText(low, ostr);
        ostr.write('_');
        writeText(high, ostr);
--- a/dbms/src/Parsers/ExpressionElementParsers.cpp
+++ b/dbms/src/Parsers/ExpressionElementParsers.cpp
@ -1026,27 +1026,31 @@ bool ParserStringLiteral::parseImpl(Pos & pos, ASTPtr & node, Expected & expecte
    return true;
 }
-
+template <typename Collection>
-bool ParserArrayOfLiterals::parseImpl(Pos & pos, ASTPtr & node, Expected & expected)
+bool ParserCollectionOfLiterals<Collection>::parseImpl(Pos & pos, ASTPtr & node, Expected & expected)
 {
-    if (pos->type != TokenType::OpeningSquareBracket)
+    if (pos->type != opening_bracket)
        return false;
    Pos literal_begin = pos;
-    Array arr;
+    Collection arr;
    ParserLiteral literal_p;
    ++pos;
    while (pos.isValid())
    {
        if (!arr.empty())
        {
-            if (pos->type == TokenType::ClosingSquareBracket)
+            if (pos->type == closing_bracket)
            {
-                auto literal = std::make_shared<ASTLiteral>(arr);
+                std::shared_ptr<ASTLiteral> literal;
                /// Parse one-element tuples (e.g. (1)) later as single values for backward compatibility.
                if (std::is_same_v<Collection, Tuple> && arr.size() == 1)
                    return false;
                literal = std::make_shared<ASTLiteral>(arr);
                literal->begin = literal_begin;
                literal->end = ++pos;
                node = literal;
@ -1058,7 +1062,8 @@ bool ParserArrayOfLiterals::parseImpl(Pos & pos, ASTPtr & node, Expected & expec
            }
            else
            {
-                expected.add(pos, "comma or closing square bracket");
+                String message = String("comma or ") + getTokenName(closing_bracket);
                expected.add(pos, message.c_str());
                return false;
            }
        }
@ -1070,7 +1075,7 @@ bool ParserArrayOfLiterals::parseImpl(Pos & pos, ASTPtr & node, Expected & expec
        arr.push_back(literal_node->as<ASTLiteral &>().value);
    }
-    expected.add(pos, "closing square bracket");
+    expected.add(pos, getTokenName(closing_bracket));
    return false;
 }
@ -1271,6 +1276,7 @@ bool ParserSubstitution::parseImpl(Pos & pos, ASTPtr & node, Expected & expected
 bool ParserExpressionElement::parseImpl(Pos & pos, ASTPtr & node, Expected & expected)
 {
    return ParserSubquery().parse(pos, node, expected)
        || ParserTupleOfLiterals().parse(pos, node, expected)
        || ParserParenthesisExpression().parse(pos, node, expected)
        || ParserArrayOfLiterals().parse(pos, node, expected)
        || ParserArray().parse(pos, node, expected)
--- a/dbms/src/Parsers/ExpressionElementParsers.h
+++ b/dbms/src/Parsers/ExpressionElementParsers.h
@ -1,5 +1,6 @@
 #pragma once
 #include <Core/Field.h>
 #include <Parsers/IParserBase.h>
@ -223,17 +224,50 @@ protected:
 };
-/** An array of literals.
+/** An array or tuple of literals.
-  * Arrays can also be parsed as an application of [] operator.
+  * Arrays can also be parsed as an application of [] operator and tuples as an application of 'tuple' function.
-  * But parsing the whole array as a whole constant seriously speeds up the analysis of expressions in the case of very large arrays.
+  * But parsing the whole array/tuple as a whole constant seriously speeds up the analysis of expressions in the case of very large collection.
-  * We try to parse the array as an array of literals first (fast path),
+  * We try to parse the array or tuple as a collection of literals first (fast path),
-  *  and if it did not work out (when the array consists of complex expressions) - parse as an application of [] operator (slow path).
+  *  and if it did not work out (when the collection consists of complex expressions) -
  *  parse as an application of [] operator or 'tuple' function (slow path).
  */
 template <typename Collection>
 class ParserCollectionOfLiterals : public IParserBase
 {
 public:
    ParserCollectionOfLiterals(TokenType opening_bracket_, TokenType closing_bracket_)
        : opening_bracket(opening_bracket_), closing_bracket(closing_bracket_) {}
 protected:
    const char * getName() const override { return "collection of literals"; }
    bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
 private:
    TokenType opening_bracket;
    TokenType closing_bracket;
 };
 /// A tuple of literals with same type.
 class ParserTupleOfLiterals : public IParserBase
 {
 public:
    ParserCollectionOfLiterals<Tuple> tuple_parser{TokenType::OpeningRoundBracket, TokenType::ClosingRoundBracket};
 protected:
    const char * getName() const override { return "tuple"; }
    bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override
    {
        return tuple_parser.parse(pos, node, expected);
    }
 };
 class ParserArrayOfLiterals : public IParserBase
 {
 public:
    ParserCollectionOfLiterals<Array> array_parser{TokenType::OpeningSquareBracket, TokenType::ClosingSquareBracket};
 protected:
    const char * getName() const override { return "array"; }
-    bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override;
+    bool parseImpl(Pos & pos, ASTPtr & node, Expected & expected) override
    {
        return array_parser.parse(pos, node, expected);
    }
 };
--- a/dbms/src/Parsers/ParserCreateUserQuery.cpp
+++ b/dbms/src/Parsers/ParserCreateUserQuery.cpp
@ -4,6 +4,7 @@
 #include <Parsers/parseUserName.h>
 #include <Parsers/parseIdentifierOrStringLiteral.h>
 #include <Parsers/ExpressionElementParsers.h>
 #include <Parsers/ExpressionListParsers.h>
 #include <Parsers/ASTLiteral.h>
 #include <Parsers/ASTExtendedRoleSet.h>
 #include <Parsers/ParserExtendedRoleSet.h>
@ -168,34 +169,38 @@ namespace
                else if (ParserKeyword{"NAME REGEXP"}.ignore(pos, expected))
                {
                    ASTPtr ast;
-                    if (!ParserStringLiteral{}.parse(pos, ast, expected))
+                    if (!ParserList{std::make_unique<ParserStringLiteral>(), std::make_unique<ParserToken>(TokenType::Comma), false}.parse(pos, ast, expected))
                        return false;
-                    new_hosts.addNameRegexp(ast->as<const ASTLiteral &>().value.safeGet<String>());
+                    for (const auto & name_regexp_ast : ast->children)
                        new_hosts.addNameRegexp(name_regexp_ast->as<const ASTLiteral &>().value.safeGet<String>());
                }
                else if (ParserKeyword{"NAME"}.ignore(pos, expected))
                {
                    ASTPtr ast;
-                    if (!ParserStringLiteral{}.parse(pos, ast, expected))
+                    if (!ParserList{std::make_unique<ParserStringLiteral>(), std::make_unique<ParserToken>(TokenType::Comma), false}.parse(pos, ast, expected))
                        return false;
-                    new_hosts.addName(ast->as<const ASTLiteral &>().value.safeGet<String>());
+                    for (const auto & name_ast : ast->children)
                        new_hosts.addName(name_ast->as<const ASTLiteral &>().value.safeGet<String>());
                }
                else if (ParserKeyword{"IP"}.ignore(pos, expected))
                {
                    ASTPtr ast;
-                    if (!ParserStringLiteral{}.parse(pos, ast, expected))
+                    if (!ParserList{std::make_unique<ParserStringLiteral>(), std::make_unique<ParserToken>(TokenType::Comma), false}.parse(pos, ast, expected))
                        return false;
-                    new_hosts.addSubnet(ast->as<const ASTLiteral &>().value.safeGet<String>());
+                    for (const auto & subnet_ast : ast->children)
                        new_hosts.addSubnet(subnet_ast->as<const ASTLiteral &>().value.safeGet<String>());
                }
                else if (ParserKeyword{"LIKE"}.ignore(pos, expected))
                {
                    ASTPtr ast;
-                    if (!ParserStringLiteral{}.parse(pos, ast, expected))
+                    if (!ParserList{std::make_unique<ParserStringLiteral>(), std::make_unique<ParserToken>(TokenType::Comma), false}.parse(pos, ast, expected))
                        return false;
-                    new_hosts.addLikePattern(ast->as<const ASTLiteral &>().value.safeGet<String>());
+                    for (const auto & pattern_ast : ast->children)
                        new_hosts.addLikePattern(pattern_ast->as<const ASTLiteral &>().value.safeGet<String>());
                }
                else
                    return false;
--- a/dbms/src/Parsers/ParserPartition.cpp
+++ b/dbms/src/Parsers/ParserPartition.cpp
@ -38,14 +38,34 @@ bool ParserPartition::parseImpl(Pos & pos, ASTPtr & node, Expected & expected)
        String fields_str;
        const auto * tuple_ast = value->as<ASTFunction>();
        bool surrounded_by_parens = false;
        if (tuple_ast && tuple_ast->name == "tuple")
        {
            surrounded_by_parens = true;
            const auto * arguments_ast = tuple_ast->arguments->as<ASTExpressionList>();
            if (arguments_ast)
                fields_count = arguments_ast->children.size();
            else
                fields_count = 0;
        }
        else if (auto literal = value->as<ASTLiteral>())
        {
            if (literal->value.getType() == Field::Types::Tuple)
            {
                surrounded_by_parens = true;
                fields_count = literal->value.get<Tuple &>().size();
            }
            else
            {
                fields_count = 1;
                fields_str = String(begin->begin, pos->begin - begin->begin);
            }
        }
        else
            return false;
        if (surrounded_by_parens)
        {
            Pos left_paren = begin;
            Pos right_paren = pos;
@ -61,13 +81,6 @@ bool ParserPartition::parseImpl(Pos & pos, ASTPtr & node, Expected & expected)
            fields_str = String(left_paren->end, right_paren->begin - left_paren->end);
        }
        else if (value->as<ASTLiteral>())
        {
            fields_count = 1;
            fields_str = String(begin->begin, pos->begin - begin->begin);
        }
        else
            return false;
        partition->value = value;
        partition->children.push_back(value);
--- a/dbms/src/Processors/Formats/Impl/ConstantExpressionTemplate.cpp
+++ b/dbms/src/Processors/Formats/Impl/ConstantExpressionTemplate.cpp
@ -30,13 +30,27 @@ namespace ErrorCodes
    extern const int SYNTAX_ERROR;
 }
 struct SpecialParserType
 {
-    bool is_array = false;
+    SpecialParserType() = default;
-    bool is_nullable = false;
+    explicit SpecialParserType(Field::Types::Which main_type_) : main_type(main_type_) {}
    Field::Types::Which nested_type = Field::Types::Which::String;
-    bool useDefaultParser() const { return nested_type == Field::Types::Which::String; }
+    Field::Types::Which main_type = Field::Types::String;
    bool is_nullable = false;
    bool is_array = false;
    bool is_tuple = false;
    /// Type and nullability
    std::vector<std::pair<Field::Types::Which, bool>> nested_types;
    bool useDefaultParser() const
    {
        return main_type == Field::Types::String || (!nested_types.empty()
            && std::all_of(
                nested_types.begin(),
                nested_types.end(),
                [](const auto & type) { return type.first == Field::Types::String; }));
    }
 };
 struct LiteralInfo
@ -54,6 +68,54 @@ struct LiteralInfo
    SpecialParserType special_parser;
 };
 static void fillLiteralInfo(DataTypes & nested_types, LiteralInfo & info)
 {
    size_t elements_num = nested_types.size();
    info.special_parser.nested_types.reserve(elements_num);
    for (auto nested_type : nested_types)
    {
        /// It can be Array(Nullable(nested_type)) or Tuple(..., Nullable(nested_type), ...)
        bool is_nullable = false;
        if (auto nullable = dynamic_cast<const DataTypeNullable *>(nested_type.get()))
        {
            nested_type = nullable->getNestedType();
            is_nullable = true;
        }
        WhichDataType type_info{nested_type};
        Field::Types::Which field_type;
        /// Promote integers to 64 bit types
        if (type_info.isNativeUInt())
        {
            nested_type = std::make_shared<DataTypeUInt64>();
            field_type = Field::Types::UInt64;
        }
        else if (type_info.isNativeInt())
        {
            nested_type = std::make_shared<DataTypeInt64>();
            field_type = Field::Types::Int64;
        }
        else if (type_info.isFloat64())
        {
            field_type = Field::Types::Float64;
        }
        else if (type_info.isString())
        {
            field_type = Field::Types::String;
        }
        else
            throw Exception("Unexpected literal type inside Array: " + nested_type->getName() + ". It's a bug",
                            ErrorCodes::LOGICAL_ERROR);
        if (is_nullable)
            nested_type = std::make_shared<DataTypeNullable>(nested_type);
        info.special_parser.nested_types.emplace_back(field_type, is_nullable);
    }
 }
 /// Extracts ASTLiterals from expression, replaces them with ASTIdentifiers where needed
 /// and deduces data types for dummy columns by field type of literal
 class ReplaceLiteralsVisitor
@ -137,7 +199,7 @@ private:
        /// We have to use ParserNumber instead of type->deserializeAsTextQuoted() for arithmetic types
        /// to check actual type of literal and avoid possible overflow and precision issues.
-        info.special_parser = SpecialParserType{false, false, field_type};
+        info.special_parser = SpecialParserType(field_type);
        /// Do not use 8, 16 and 32 bit types, so template will match all integers
        if (field_type == Field::Types::UInt64)
@ -152,47 +214,17 @@ private:
        {
            info.special_parser.is_array = true;
            info.type = applyVisitor(FieldToDataType(), info.literal->value);
-            auto nested_type = assert_cast<const DataTypeArray &>(*info.type).getNestedType();
+            DataTypes nested_types = { assert_cast<const DataTypeArray &>(*info.type).getNestedType() };
-
+            fillLiteralInfo(nested_types, info);
-            /// It can be Array(Nullable(nested_type))
+            info.type = std::make_shared<DataTypeArray>(nested_types[0]);
-            bool array_of_nullable = false;
+        }
-            if (auto nullable = dynamic_cast<const DataTypeNullable *>(nested_type.get()))
+        else if (field_type == Field::Types::Tuple)
-            {
+        {
-                nested_type = nullable->getNestedType();
+            info.special_parser.is_tuple = true;
-                array_of_nullable = true;
+            info.type = applyVisitor(FieldToDataType(), info.literal->value);
-            }
+            auto nested_types = assert_cast<const DataTypeTuple &>(*info.type).getElements();
-
+            fillLiteralInfo(nested_types, info);
-            WhichDataType type_info{nested_type};
+            info.type = std::make_shared<DataTypeTuple>(nested_types);
            /// Promote integers to 64 bit types
            if (type_info.isNativeUInt())
            {
                nested_type = std::make_shared<DataTypeUInt64>();
                info.special_parser.nested_type = Field::Types::UInt64;
            }
            else if (type_info.isNativeInt())
            {
                nested_type = std::make_shared<DataTypeInt64>();
                info.special_parser.nested_type = Field::Types::Int64;
            }
            else if (type_info.isFloat64())
            {
                info.special_parser.nested_type = Field::Types::Float64;
            }
            else if (type_info.isString())
            {
                info.special_parser.nested_type = Field::Types::String;
            }
            else
                throw Exception("Unexpected literal type inside Array: " + nested_type->getName() + ". It's a bug",
                                ErrorCodes::LOGICAL_ERROR);
            if (array_of_nullable)
            {
                nested_type = std::make_shared<DataTypeNullable>(nested_type);
                info.special_parser.is_nullable = true;
            }
            info.type = std::make_shared<DataTypeArray>(nested_type);
        }
        else
            throw Exception(String("Unexpected literal type ") + info.literal->value.getTypeName() + ". It's a bug",
@ -404,36 +436,50 @@ bool ConstantExpressionTemplate::parseLiteralAndAssertType(ReadBuffer & istr, co
    /// If literal does not fit entirely in the buffer, parsing error will happen.
    /// However, it's possible to deduce new template (or use template from cache) after error like it was template mismatch.
-    if (type_info.is_array)
+    if (type_info.is_array || type_info.is_tuple)
    {
        /// TODO faster way to check types without using Parsers
        ParserArrayOfLiterals parser_array;
        ParserTupleOfLiterals parser_tuple;
        Tokens tokens_number(istr.position(), istr.buffer().end());
        IParser::Pos iterator(tokens_number, settings.max_parser_depth);
        Expected expected;
        ASTPtr ast;
-
+        if (!parser_array.parse(iterator, ast, expected) && !parser_tuple.parse(iterator, ast, expected))
        if (!parser_array.parse(iterator, ast, expected))
            return false;
        istr.position() = const_cast<char *>(iterator->begin);
-        const Field & array = ast->as<ASTLiteral &>().value;
+        const Field & collection = ast->as<ASTLiteral &>().value;
-        auto array_type = applyVisitor(FieldToDataType(), array);
+        auto collection_type = applyVisitor(FieldToDataType(), collection);
        auto nested_type = assert_cast<const DataTypeArray &>(*array_type).getNestedType();
        if (type_info.is_nullable)
            if (auto nullable = dynamic_cast<const DataTypeNullable *>(nested_type.get()))
                nested_type = nullable->getNestedType();
-        WhichDataType nested_type_info(nested_type);
+        DataTypes nested_types;
-        if ((nested_type_info.isNativeUInt() && type_info.nested_type == Type::UInt64) ||
+        if (type_info.is_array)
-            (nested_type_info.isNativeInt()  && type_info.nested_type == Type::Int64)  ||
+            nested_types = { assert_cast<const DataTypeArray &>(*collection_type).getNestedType() };
-            (nested_type_info.isFloat64()    && type_info.nested_type == Type::Float64))
+        else
            nested_types = assert_cast<const DataTypeTuple &>(*collection_type).getElements();
        for (size_t i = 0; i < nested_types.size(); ++i)
        {
-            Field array_same_types = convertFieldToType(array, *complex_type, nullptr);
+            const auto & [nested_field_type, is_nullable] = type_info.nested_types[i];
-            columns[column_idx]->insert(array_same_types);
+            if (is_nullable)
-            return true;
+                if (auto nullable = dynamic_cast<const DataTypeNullable *>(nested_types[i].get()))
                    nested_types[i] = nullable->getNestedType();
            WhichDataType nested_type_info(nested_types[i]);
            bool are_types_compatible =
                (nested_type_info.isNativeUInt() && nested_field_type == Type::UInt64) ||
                (nested_type_info.isNativeInt()  && nested_field_type == Type::Int64)  ||
                (nested_type_info.isFloat64()    && nested_field_type == Type::Float64);
            if (!are_types_compatible)
                return false;
        }
-        return false;
+
        Field array_same_types = convertFieldToType(collection, *complex_type, nullptr);
        columns[column_idx]->insert(array_same_types);
        return true;
    }
    else
    {
@ -470,14 +516,14 @@ bool ConstantExpressionTemplate::parseLiteralAndAssertType(ReadBuffer & istr, co
            if (pos_integer == pos_double && errno != ERANGE && (!negative || uint_value <= (1ULL << 63)))
            {
                istr.position() += pos_integer - buf;
-                if (negative && type_info.nested_type == Type::Int64)
+                if (negative && type_info.main_type == Type::Int64)
                    number = static_cast<Int64>(-uint_value);
-                else if (!negative && type_info.nested_type == Type::UInt64)
+                else if (!negative && type_info.main_type == Type::UInt64)
                    number = uint_value;
                else
                    return false;
            }
-            else if (type_info.nested_type == Type::Float64)
+            else if (type_info.main_type == Type::Float64)
            {
                istr.position() += pos_double - buf;
                number = float_value;
--- a/dbms/src/Processors/Formats/Impl/RegexpRowInputFormat.cpp
+++ b/dbms/src/Processors/Formats/Impl/RegexpRowInputFormat.cpp
@ -0,0 +1,195 @@
 #include <stdlib.h>
 #include <common/find_symbols.h>
 #include <Processors/Formats/Impl/RegexpRowInputFormat.h>
 #include <DataTypes/DataTypeNullable.h>
 #include <IO/ReadHelpers.h>
 namespace DB
 {
 namespace ErrorCodes
 {
    extern const int INCORRECT_DATA;
    extern const int BAD_ARGUMENTS;
 }
 RegexpRowInputFormat::RegexpRowInputFormat(
        ReadBuffer & in_, const Block & header_, Params params_, const FormatSettings & format_settings_)
        : IRowInputFormat(header_, in_, std::move(params_)), buf(in_), format_settings(format_settings_), regexp(format_settings_.regexp.regexp)
 {
    size_t fields_count = regexp.NumberOfCapturingGroups();
    matched_fields.resize(fields_count);
    re2_arguments.resize(fields_count);
    re2_arguments_ptrs.resize(fields_count);
    for (size_t i = 0; i != fields_count; ++i)
    {
        // Bind an argument to a matched field.
        re2_arguments[i] = &matched_fields[i];
        // Save pointer to argument.
        re2_arguments_ptrs[i] = &re2_arguments[i];
    }
    field_format = stringToFormat(format_settings_.regexp.escaping_rule);
 }
 RegexpRowInputFormat::ColumnFormat RegexpRowInputFormat::stringToFormat(const String & format)
 {
    if (format == "Escaped")
        return ColumnFormat::Escaped;
    if (format == "Quoted")
        return ColumnFormat::Quoted;
    if (format == "CSV")
        return ColumnFormat::Csv;
    if (format == "JSON")
        return ColumnFormat::Json;
    throw Exception("Unsupported column format \"" + format + "\".", ErrorCodes::BAD_ARGUMENTS);
 }
 bool RegexpRowInputFormat::readField(size_t index, MutableColumns & columns)
 {
    const auto & type = getPort().getHeader().getByPosition(index).type;
    bool parse_as_nullable = format_settings.null_as_default && !type->isNullable();
    bool read = true;
    ReadBuffer field_buf(const_cast<char *>(matched_fields[index].data()), matched_fields[index].size(), 0);
    try
    {
        switch (field_format)
        {
            case ColumnFormat::Escaped:
                if (parse_as_nullable)
                    read = DataTypeNullable::deserializeTextEscaped(*columns[index], field_buf, format_settings, type);
                else
                    type->deserializeAsTextEscaped(*columns[index], field_buf, format_settings);
                break;
            case ColumnFormat::Quoted:
                if (parse_as_nullable)
                    read = DataTypeNullable::deserializeTextQuoted(*columns[index], field_buf, format_settings, type);
                else
                    type->deserializeAsTextQuoted(*columns[index], field_buf, format_settings);
                break;
            case ColumnFormat::Csv:
                if (parse_as_nullable)
                    read = DataTypeNullable::deserializeTextCSV(*columns[index], field_buf, format_settings, type);
                else
                    type->deserializeAsTextCSV(*columns[index], field_buf, format_settings);
                break;
            case ColumnFormat::Json:
                if (parse_as_nullable)
                    read = DataTypeNullable::deserializeTextJSON(*columns[index], field_buf, format_settings, type);
                else
                    type->deserializeAsTextJSON(*columns[index], field_buf, format_settings);
                break;
            default:
                break;
        }
    }
    catch (Exception & e)
    {
        e.addMessage("(while read the value of column " +  getPort().getHeader().getByPosition(index).name + ")");
        throw;
    }
    return read;
 }
 void RegexpRowInputFormat::readFieldsFromMatch(MutableColumns & columns, RowReadExtension & ext)
 {
    if (matched_fields.size() != columns.size())
        throw Exception("The number of matched fields in line doesn't match the number of columns.", ErrorCodes::INCORRECT_DATA);
    ext.read_columns.assign(columns.size(), false);
    for (size_t columns_index = 0; columns_index < columns.size(); ++columns_index)
    {
        ext.read_columns[columns_index] = readField(columns_index, columns);
    }
 }
 bool RegexpRowInputFormat::readRow(MutableColumns & columns, RowReadExtension & ext)
 {
    if (buf.eof())
        return false;
    PeekableReadBufferCheckpoint checkpoint{buf};
    size_t line_size = 0;
    do
    {
        char * pos = find_first_symbols<'\n', '\r'>(buf.position(), buf.buffer().end());
        line_size += pos - buf.position();
        buf.position() = pos;
    } while (buf.position() == buf.buffer().end() && !buf.eof());
    buf.makeContinuousMemoryFromCheckpointToPos();
    buf.rollbackToCheckpoint();
    bool match = RE2::FullMatchN(re2::StringPiece(buf.position(), line_size), regexp, re2_arguments_ptrs.data(), re2_arguments_ptrs.size());
    bool read_line = true;
    if (!match)
    {
        if (!format_settings.regexp.skip_unmatched)
            throw Exception("Line \"" + std::string(buf.position(), line_size) + "\" doesn't match the regexp.", ErrorCodes::INCORRECT_DATA);
        read_line = false;
    }
    if (read_line)
        readFieldsFromMatch(columns, ext);
    buf.position() += line_size;
    checkChar('\r', buf);
    if (!buf.eof() && !checkChar('\n', buf))
        throw Exception("No \\n after \\r at the end of line.", ErrorCodes::INCORRECT_DATA);
    return true;
 }
 void registerInputFormatProcessorRegexp(FormatFactory & factory)
 {
    factory.registerInputFormatProcessor("Regexp", [](
            ReadBuffer & buf,
            const Block & sample,
            IRowInputFormat::Params params,
            const FormatSettings & settings)
    {
        return std::make_shared<RegexpRowInputFormat>(buf, sample, std::move(params), settings);
    });
 }
 static bool fileSegmentationEngineRegexpImpl(ReadBuffer & in, DB::Memory<> & memory, size_t min_chunk_size)
 {
    char * pos = in.position();
    bool need_more_data = true;
    while (loadAtPosition(in, memory, pos) && need_more_data)
    {
        pos = find_first_symbols<'\n', '\r'>(pos, in.buffer().end());
        if (pos == in.buffer().end())
            continue;
        // Support DOS-style newline ("\r\n")
        if (*pos == '\r')
        {
            ++pos;
            if (pos == in.buffer().end())
                loadAtPosition(in, memory, pos);
        }
        if (memory.size() + static_cast<size_t>(pos - in.position()) >= min_chunk_size)
            need_more_data = false;
        ++pos;
    }
    saveUpToPosition(in, memory, pos);
    return loadAtPosition(in, memory, pos);
 }
 void registerFileSegmentationEngineRegexp(FormatFactory & factory)
 {
    factory.registerFileSegmentationEngine("Regexp", &fileSegmentationEngineRegexpImpl);
 }
 }
--- a/dbms/src/Processors/Formats/Impl/RegexpRowInputFormat.h
+++ b/dbms/src/Processors/Formats/Impl/RegexpRowInputFormat.h
@ -0,0 +1,53 @@
 #pragma once
 #include <re2/re2.h>
 #include <re2/stringpiece.h>
 #include <string>
 #include <vector>
 #include <Core/Block.h>
 #include <Processors/Formats/IRowInputFormat.h>
 #include <Formats/FormatSettings.h>
 #include <Formats/FormatFactory.h>
 #include <IO/PeekableReadBuffer.h>
 #include <Formats/ParsedTemplateFormatString.h>
 namespace DB
 {
 class ReadBuffer;
 /// Regexp input format.
 /// This format applies regular expression from format_regexp setting for every line of file
 /// (the lines must be separated by newline character ('\n') or DOS-style newline ("\r\n")).
 /// Every matched subpattern will be parsed with the method of corresponding data type
 /// (according to format_regexp_escaping_rule setting). If the regexp did not match the line,
 /// if format_regexp_skip_unmatched is 1, the line is silently skipped, if the setting is 0, exception will be thrown.
 class RegexpRowInputFormat : public IRowInputFormat
 {
    using ColumnFormat = ParsedTemplateFormatString::ColumnFormat;
 public:
    RegexpRowInputFormat(ReadBuffer & in_, const Block & header_, Params params_, const FormatSettings & format_settings_);
    String getName() const override { return "RegexpRowInputFormat"; }
    bool readRow(MutableColumns & columns, RowReadExtension & ext) override;
 private:
    bool readField(size_t index, MutableColumns & columns);
    void readFieldsFromMatch(MutableColumns & columns, RowReadExtension & ext);
    static ColumnFormat stringToFormat(const String & format);
    PeekableReadBuffer buf;
    const FormatSettings format_settings;
    ColumnFormat field_format;
    RE2 regexp;
    // The vector of fields extracted from line using regexp.
    std::vector<re2::StringPiece> matched_fields;
    // These two vectors are needed to use RE2::FullMatchN (function for extracting fields).
    std::vector<RE2::Arg> re2_arguments;
    std::vector<RE2::Arg *> re2_arguments_ptrs;
 };
 }
--- a/dbms/src/Storages/IStorage.cpp
+++ b/dbms/src/Storages/IStorage.cpp
@ -314,11 +314,9 @@ bool IStorage::isVirtualColumn(const String & column_name) const
    return getColumns().get(column_name).is_virtual;
 }
-TableStructureReadLockHolder IStorage::lockStructureForShare(bool will_add_new_data, const String & query_id)
+TableStructureReadLockHolder IStorage::lockStructureForShare(const String & query_id)
 {
    TableStructureReadLockHolder result;
    if (will_add_new_data)
        result.new_data_structure_lock = new_data_structure_lock->getLock(RWLockImpl::Read, query_id);
    result.structure_lock = structure_lock->getLock(RWLockImpl::Read, query_id);
    if (is_dropped)
@ -326,43 +324,32 @@ TableStructureReadLockHolder IStorage::lockStructureForShare(bool will_add_new_d
    return result;
 }
-TableStructureWriteLockHolder IStorage::lockAlterIntention(const String & query_id)
+TableStructureWriteLockHolder IStorage::lockAlterIntention()
 {
    TableStructureWriteLockHolder result;
-    result.alter_intention_lock = alter_intention_lock->getLock(RWLockImpl::Write, query_id);
+    result.alter_lock = std::unique_lock(alter_lock);
    if (is_dropped)
        throw Exception("Table is dropped", ErrorCodes::TABLE_IS_DROPPED);
    return result;
 }
 void IStorage::lockNewDataStructureExclusively(TableStructureWriteLockHolder & lock_holder, const String & query_id)
 {
    if (!lock_holder.alter_intention_lock)
        throw Exception("Alter intention lock for table " + getStorageID().getNameForLogs() + " was not taken. This is a bug.", ErrorCodes::LOGICAL_ERROR);
    lock_holder.new_data_structure_lock = new_data_structure_lock->getLock(RWLockImpl::Write, query_id);
 }
 void IStorage::lockStructureExclusively(TableStructureWriteLockHolder & lock_holder, const String & query_id)
 {
-    if (!lock_holder.alter_intention_lock)
+    if (!lock_holder.alter_lock)
        throw Exception("Alter intention lock for table " + getStorageID().getNameForLogs() + " was not taken. This is a bug.", ErrorCodes::LOGICAL_ERROR);
    if (!lock_holder.new_data_structure_lock)
        lock_holder.new_data_structure_lock = new_data_structure_lock->getLock(RWLockImpl::Write, query_id);
    lock_holder.structure_lock = structure_lock->getLock(RWLockImpl::Write, query_id);
 }
 TableStructureWriteLockHolder IStorage::lockExclusively(const String & query_id)
 {
    TableStructureWriteLockHolder result;
-    result.alter_intention_lock = alter_intention_lock->getLock(RWLockImpl::Write, query_id);
+    result.alter_lock = std::unique_lock(alter_lock);
    if (is_dropped)
        throw Exception("Table is dropped", ErrorCodes::TABLE_IS_DROPPED);
    result.new_data_structure_lock = new_data_structure_lock->getLock(RWLockImpl::Write, query_id);
    result.structure_lock = structure_lock->getLock(RWLockImpl::Write, query_id);
    return result;
--- a/dbms/src/Storages/IStorage.h
+++ b/dbms/src/Storages/IStorage.h
@ -203,16 +203,11 @@ public:
    /// Acquire this lock if you need the table structure to remain constant during the execution of
    /// the query. If will_add_new_data is true, this means that the query will add new data to the table
    /// (INSERT or a parts merge).
-    TableStructureReadLockHolder lockStructureForShare(bool will_add_new_data, const String & query_id);
+    TableStructureReadLockHolder lockStructureForShare(const String & query_id);
    /// Acquire this lock at the start of ALTER to lock out other ALTERs and make sure that only you
    /// can modify the table structure. It can later be upgraded to the exclusive lock.
-    TableStructureWriteLockHolder lockAlterIntention(const String & query_id);
+    TableStructureWriteLockHolder lockAlterIntention();
    /// Upgrade alter intention lock and make sure that no new data is inserted into the table.
    /// This is used by the ALTER MODIFY of the MergeTree storage to consistently determine
    /// the set of parts that needs to be altered.
    void lockNewDataStructureExclusively(TableStructureWriteLockHolder & lock_holder, const String & query_id);
    /// Upgrade alter intention lock to the full exclusive structure lock. This is done by ALTER queries
    /// to ensure that no other query uses the table structure and it can be safely changed.
@ -224,8 +219,12 @@ public:
    /** Returns stage to which query is going to be processed in read() function.
      * (Normally, the function only reads the columns from the list, but in other cases,
      *  for example, the request can be partially processed on a remote server.)
      *
      * SelectQueryInfo is required since the stage can depends on the query
      * (see Distributed() engine and optimize_skip_unused_shards).
      */
-    virtual QueryProcessingStage::Enum getQueryProcessingStage(const Context &) const { return QueryProcessingStage::FetchColumns; }
+    QueryProcessingStage::Enum getQueryProcessingStage(const Context & context) const { return getQueryProcessingStage(context, {}); }
    virtual QueryProcessingStage::Enum getQueryProcessingStage(const Context &, const ASTPtr &) const { return QueryProcessingStage::FetchColumns; }
    /** Watch live changes to the table.
     * Accepts a list of columns to read, as well as a description of the query,
@ -465,25 +464,38 @@ public:
    /// Returns storage policy if storage supports it
    virtual StoragePolicyPtr getStoragePolicy() const { return {}; }
-    /** If it is possible to quickly determine exact number of rows in the table at this moment of time, then return it.
+    /// If it is possible to quickly determine exact number of rows in the table at this moment of time, then return it.
-     */
+    /// Used for:
    /// - Simple count() opimization
    /// - For total_rows column in system.tables
    ///
    /// Does takes underlying Storage (if any) into account.
    virtual std::optional<UInt64> totalRows() const
    {
        return {};
    }
    /// If it is possible to quickly determine exact number of bytes for the table on storage:
    /// - memory (approximated)
    /// - disk (compressed)
    ///
    /// Used for:
    /// - For total_bytes column in system.tables
    //
    /// Does not takes underlying Storage (if any) into account
    /// (since for Buffer we still need to know how much bytes it uses).
    virtual std::optional<UInt64> totalBytes() const
    {
        return {};
    }
 private:
    /// You always need to take the next three locks in this order.
    /// If you hold this lock exclusively, you can be sure that no other structure modifying queries
    /// (e.g. ALTER, DROP) are concurrently executing. But queries that only read table structure
    /// (e.g. SELECT, INSERT) can continue to execute.
-    mutable RWLock alter_intention_lock = RWLockImpl::create();
+    mutable std::mutex alter_lock;
    /// It is taken for share for the entire INSERT query and the entire merge of the parts (for MergeTree).
    /// ALTER COLUMN queries acquire an exclusive lock to ensure that no new parts with the old structure
    /// are added to the table and thus the set of parts to modify doesn't change.
    mutable RWLock new_data_structure_lock = RWLockImpl::create();
    /// Lock for the table column structure (names, types, etc.) and data path.
    /// It is taken in exclusive mode by queries that modify them (e.g. RENAME, ALTER and DROP)
--- a/dbms/src/Storages/LiveView/StorageBlocks.h
+++ b/dbms/src/Storages/LiveView/StorageBlocks.h
@ -26,7 +26,7 @@ public:
        return std::make_shared<StorageBlocks>(table_id, columns, std::move(pipes), to_stage);
    }
    std::string getName() const override { return "Blocks"; }
-    QueryProcessingStage::Enum getQueryProcessingStage(const Context & /*context*/) const override { return to_stage; }
+    QueryProcessingStage::Enum getQueryProcessingStage(const Context &, const ASTPtr &) const override { return to_stage; }
    Pipes read(
        const Names & /*column_names*/,
--- a/dbms/src/Storages/LiveView/StorageLiveView.cpp
+++ b/dbms/src/Storages/LiveView/StorageLiveView.cpp
@ -518,14 +518,11 @@ void StorageLiveView::drop()
    condition.notify_all();
 }
-void StorageLiveView::refresh(const Context & context)
+void StorageLiveView::refresh()
 {
-    auto alter_lock = lockAlterIntention(context.getCurrentQueryId());
+    std::lock_guard lock(mutex);
-    {
+    if (getNewBlocks())
-        std::lock_guard lock(mutex);
+        condition.notify_all();
        if (getNewBlocks())
            condition.notify_all();
    }
 }
 Pipes StorageLiveView::read(
--- a/dbms/src/Storages/LiveView/StorageLiveView.h
+++ b/dbms/src/Storages/LiveView/StorageLiveView.h
@ -123,7 +123,7 @@ public:
    void startup() override;
    void shutdown() override;
-    void refresh(const Context & context);
+    void refresh();
    Pipes read(
        const Names & column_names,
--- a/dbms/src/Storages/MergeTree/DataPartsExchange.cpp
+++ b/dbms/src/Storages/MergeTree/DataPartsExchange.cpp
@ -85,7 +85,7 @@ void Service::processQuery(const Poco::Net::HTMLForm & params, ReadBuffer & /*bo
    try
    {
-        auto storage_lock = data.lockStructureForShare(false, RWLockImpl::NO_QUERY);
+        auto storage_lock = data.lockStructureForShare(RWLockImpl::NO_QUERY);
        MergeTreeData::DataPartPtr part = findPart(part_name);
--- a/dbms/src/Storages/MergeTree/IMergeTreeDataPart.cpp
+++ b/dbms/src/Storages/MergeTree/IMergeTreeDataPart.cpp
@ -406,8 +406,8 @@ void IMergeTreeDataPart::loadColumnsChecksumsIndexes(bool require_columns_checks
    loadColumns(require_columns_checksums);
    loadChecksums(require_columns_checksums);
    calculateColumnsSizesOnDisk();
    loadIndexGranularity();
    calculateColumnsSizesOnDisk();
    loadIndex();     /// Must be called after loadIndexGranularity as it uses the value of `index_granularity`
    loadRowsCount(); /// Must be called after loadIndex() as it uses the value of `index_granularity`.
    loadPartitionAndMinMaxIndex();
--- a/Show More
+++ b/Show More